初始化项目,由ModelHub XC社区提供模型
Model: bigscience/bloomz-7b1-p3 Source: Original Platform
This commit is contained in:
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "my",
|
||||
"template_name": "Answer Given options",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5056254136333554
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='my', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='Answer Given options', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "my",
|
||||
"template_name": "Choose Story Ending",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5069490403706155
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='my', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='Choose Story Ending', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "my",
|
||||
"template_name": "Generate Ending",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4784910655195235
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='my', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='Generate Ending', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "my",
|
||||
"template_name": "Novel Correct Ending",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5102581072137657
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='my', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='Novel Correct Ending', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "my",
|
||||
"template_name": "Story Continuation and Options",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5062872270019855
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='my', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='Story Continuation and Options', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "Answer Given options",
|
||||
"evaluation": {
|
||||
"accuracy": 0.6406353408338848
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='Answer Given options', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "Choose Story Ending",
|
||||
"evaluation": {
|
||||
"accuracy": 0.6644606221045665
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='Choose Story Ending', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "Generate Ending",
|
||||
"evaluation": {
|
||||
"accuracy": 0.514890800794176
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='Generate Ending', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "Novel Correct Ending",
|
||||
"evaluation": {
|
||||
"accuracy": 0.6393117140966248
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='Novel Correct Ending', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "Story Continuation and Options",
|
||||
"evaluation": {
|
||||
"accuracy": 0.6545334215751158
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='Story Continuation and Options', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "jp",
|
||||
"template_name": "Replace",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5130344108446299
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='jp', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=4, prefixlm=False, split='test', target_max_length=256, template_config_name='en', template_name='Replace', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "jp",
|
||||
"template_name": "True or False",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5036496350364964
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='jp', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=4, prefixlm=False, split='test', target_max_length=256, template_config_name='en', template_name='True or False', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "jp",
|
||||
"template_name": "does underscore refer to",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5192909280500522
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='jp', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=4, prefixlm=False, split='test', target_max_length=256, template_config_name='en', template_name='does underscore refer to', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "jp",
|
||||
"template_name": "stand for",
|
||||
"evaluation": {
|
||||
"accuracy": 0.49635036496350365
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='jp', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=4, prefixlm=False, split='test', target_max_length=256, template_config_name='en', template_name='stand for', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "jp",
|
||||
"template_name": "underscore refer to",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4994786235662148
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='jp', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=4, prefixlm=False, split='test', target_max_length=256, template_config_name='en', template_name='underscore refer to', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "Replace",
|
||||
"evaluation": {
|
||||
"accuracy": 0.49206349206349204
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=4, prefixlm=False, split='test', target_max_length=256, template_config_name='en', template_name='Replace', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "True or False",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4793650793650794
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=4, prefixlm=False, split='test', target_max_length=256, template_config_name='en', template_name='True or False', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "does underscore refer to",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4857142857142857
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=4, prefixlm=False, split='test', target_max_length=256, template_config_name='en', template_name='does underscore refer to', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "stand for",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4888888888888889
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=4, prefixlm=False, split='test', target_max_length=256, template_config_name='en', template_name='stand for', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "underscore refer to",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4857142857142857
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=4, prefixlm=False, split='test', target_max_length=256, template_config_name='en', template_name='underscore refer to', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "et",
|
||||
"template_name": "C1 or C2? premise, so/because\u2026",
|
||||
"evaluation": {
|
||||
"accuracy": 0.47
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='et', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='so/because\u2026,validation', target_max_length=256, template_config_name='en', template_name='C1 or C2? premise', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "et",
|
||||
"template_name": "best_option",
|
||||
"evaluation": {
|
||||
"accuracy": 0.52
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='et', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='best_option', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "et",
|
||||
"template_name": "cause_effect",
|
||||
"evaluation": {
|
||||
"accuracy": 0.49
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='et', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='cause_effect', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "et",
|
||||
"template_name": "i_am_hesitating",
|
||||
"evaluation": {
|
||||
"accuracy": 0.57
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='et', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='i_am_hesitating', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "et",
|
||||
"template_name": "plausible_alternatives",
|
||||
"evaluation": {
|
||||
"accuracy": 0.55
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='et', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='plausible_alternatives', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "ht",
|
||||
"template_name": "C1 or C2? premise, so/because\u2026",
|
||||
"evaluation": {
|
||||
"accuracy": 0.51
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ht', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='so/because\u2026,validation', target_max_length=256, template_config_name='en', template_name='C1 or C2? premise', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "ht",
|
||||
"template_name": "best_option",
|
||||
"evaluation": {
|
||||
"accuracy": 0.47
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ht', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='best_option', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "ht",
|
||||
"template_name": "cause_effect",
|
||||
"evaluation": {
|
||||
"accuracy": 0.55
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ht', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='cause_effect', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "ht",
|
||||
"template_name": "i_am_hesitating",
|
||||
"evaluation": {
|
||||
"accuracy": 0.51
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ht', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='i_am_hesitating', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "ht",
|
||||
"template_name": "plausible_alternatives",
|
||||
"evaluation": {
|
||||
"accuracy": 0.52
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ht', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='plausible_alternatives', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "it",
|
||||
"template_name": "C1 or C2? premise, so/because\u2026",
|
||||
"evaluation": {
|
||||
"accuracy": 0.57
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='it', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='so/because\u2026,validation', target_max_length=256, template_config_name='en', template_name='C1 or C2? premise', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "it",
|
||||
"template_name": "best_option",
|
||||
"evaluation": {
|
||||
"accuracy": 0.52
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='it', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='best_option', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "it",
|
||||
"template_name": "cause_effect",
|
||||
"evaluation": {
|
||||
"accuracy": 0.54
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='it', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='cause_effect', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "it",
|
||||
"template_name": "i_am_hesitating",
|
||||
"evaluation": {
|
||||
"accuracy": 0.57
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='it', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='i_am_hesitating', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "it",
|
||||
"template_name": "plausible_alternatives",
|
||||
"evaluation": {
|
||||
"accuracy": 0.6
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='it', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='plausible_alternatives', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "qu",
|
||||
"template_name": "C1 or C2? premise, so/because\u2026",
|
||||
"evaluation": {
|
||||
"accuracy": 0.47
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='qu', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='so/because\u2026,validation', target_max_length=256, template_config_name='en', template_name='C1 or C2? premise', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "qu",
|
||||
"template_name": "best_option",
|
||||
"evaluation": {
|
||||
"accuracy": 0.52
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='qu', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='best_option', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "qu",
|
||||
"template_name": "cause_effect",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='qu', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='cause_effect', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "qu",
|
||||
"template_name": "i_am_hesitating",
|
||||
"evaluation": {
|
||||
"accuracy": 0.48
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='qu', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='i_am_hesitating', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "qu",
|
||||
"template_name": "plausible_alternatives",
|
||||
"evaluation": {
|
||||
"accuracy": 0.54
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='qu', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='plausible_alternatives', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "tr",
|
||||
"template_name": "C1 or C2? premise, so/because\u2026",
|
||||
"evaluation": {
|
||||
"accuracy": 0.55
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='tr', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='so/because\u2026,validation', target_max_length=256, template_config_name='en', template_name='C1 or C2? premise', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "tr",
|
||||
"template_name": "best_option",
|
||||
"evaluation": {
|
||||
"accuracy": 0.48
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='tr', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='best_option', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "tr",
|
||||
"template_name": "cause_effect",
|
||||
"evaluation": {
|
||||
"accuracy": 0.53
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='tr', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='cause_effect', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "tr",
|
||||
"template_name": "i_am_hesitating",
|
||||
"evaluation": {
|
||||
"accuracy": 0.54
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='tr', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='i_am_hesitating', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "tr",
|
||||
"template_name": "plausible_alternatives",
|
||||
"evaluation": {
|
||||
"accuracy": 0.52
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='tr', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='plausible_alternatives', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "bg",
|
||||
"template_name": "GPT-3 style",
|
||||
"evaluation": {
|
||||
"accuracy": 0.43775100401606426
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='bg', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='GPT-3 style', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "bg",
|
||||
"template_name": "MNLI crowdsource",
|
||||
"evaluation": {
|
||||
"accuracy": 0.36666666666666664
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='bg', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='MNLI crowdsource', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "bg",
|
||||
"template_name": "can we infer",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4397590361445783
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='bg', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='can we infer', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "bg",
|
||||
"template_name": "guaranteed/possible/impossible",
|
||||
"evaluation": {
|
||||
"accuracy": 0.41646586345381525
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='bg', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='guaranteed/possible/impossible', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "bg",
|
||||
"template_name": "justified in saying",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4108433734939759
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='bg', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='justified in saying', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "de",
|
||||
"template_name": "GPT-3 style",
|
||||
"evaluation": {
|
||||
"accuracy": 0.470281124497992
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='de', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='GPT-3 style', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "de",
|
||||
"template_name": "MNLI crowdsource",
|
||||
"evaluation": {
|
||||
"accuracy": 0.3586345381526104
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='de', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='MNLI crowdsource', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "de",
|
||||
"template_name": "can we infer",
|
||||
"evaluation": {
|
||||
"accuracy": 0.44016064257028115
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='de', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='can we infer', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "de",
|
||||
"template_name": "guaranteed/possible/impossible",
|
||||
"evaluation": {
|
||||
"accuracy": 0.3538152610441767
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='de', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='guaranteed/possible/impossible', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "de",
|
||||
"template_name": "justified in saying",
|
||||
"evaluation": {
|
||||
"accuracy": 0.41847389558232934
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='de', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='justified in saying', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "el",
|
||||
"template_name": "GPT-3 style",
|
||||
"evaluation": {
|
||||
"accuracy": 0.41887550200803214
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='el', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='GPT-3 style', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "el",
|
||||
"template_name": "MNLI crowdsource",
|
||||
"evaluation": {
|
||||
"accuracy": 0.3598393574297189
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='el', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='MNLI crowdsource', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "el",
|
||||
"template_name": "can we infer",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4108433734939759
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='el', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='can we infer', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "el",
|
||||
"template_name": "guaranteed/possible/impossible",
|
||||
"evaluation": {
|
||||
"accuracy": 0.40682730923694777
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='el', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='guaranteed/possible/impossible', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "el",
|
||||
"template_name": "justified in saying",
|
||||
"evaluation": {
|
||||
"accuracy": 0.3823293172690763
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='el', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='justified in saying', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "GPT-3 style",
|
||||
"evaluation": {
|
||||
"accuracy": 0.46546184738955826
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='GPT-3 style', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "MNLI crowdsource",
|
||||
"evaluation": {
|
||||
"accuracy": 0.3819277108433735
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='MNLI crowdsource', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "can we infer",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4614457831325301
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='can we infer', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "guaranteed/possible/impossible",
|
||||
"evaluation": {
|
||||
"accuracy": 0.42208835341365464
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='guaranteed/possible/impossible', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "ru",
|
||||
"template_name": "justified in saying",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4389558232931727
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='ru', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='justified in saying', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "th",
|
||||
"template_name": "GPT-3 style",
|
||||
"evaluation": {
|
||||
"accuracy": 0.41646586345381525
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='th', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='GPT-3 style', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "th",
|
||||
"template_name": "MNLI crowdsource",
|
||||
"evaluation": {
|
||||
"accuracy": 0.3224899598393574
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='th', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='MNLI crowdsource', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "th",
|
||||
"template_name": "can we infer",
|
||||
"evaluation": {
|
||||
"accuracy": 0.43172690763052207
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='th', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='can we infer', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "th",
|
||||
"template_name": "guaranteed/possible/impossible",
|
||||
"evaluation": {
|
||||
"accuracy": 0.42730923694779116
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='th', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='guaranteed/possible/impossible', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "th",
|
||||
"template_name": "justified in saying",
|
||||
"evaluation": {
|
||||
"accuracy": 0.40401606425702813
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='th', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='justified in saying', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "tr",
|
||||
"template_name": "GPT-3 style",
|
||||
"evaluation": {
|
||||
"accuracy": 0.40240963855421685
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='tr', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='GPT-3 style', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "tr",
|
||||
"template_name": "MNLI crowdsource",
|
||||
"evaluation": {
|
||||
"accuracy": 0.351004016064257
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='tr', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='MNLI crowdsource', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "tr",
|
||||
"template_name": "can we infer",
|
||||
"evaluation": {
|
||||
"accuracy": 0.40441767068273093
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='tr', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='can we infer', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "tr",
|
||||
"template_name": "guaranteed/possible/impossible",
|
||||
"evaluation": {
|
||||
"accuracy": 0.3678714859437751
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='tr', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='guaranteed/possible/impossible', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xnli",
|
||||
"dataset_config_name": "tr",
|
||||
"template_name": "justified in saying",
|
||||
"evaluation": {
|
||||
"accuracy": 0.38313253012048193
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='tr', dataset_name='xnli', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3', nospace=False, output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/bloomz-7b1-p3/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='en', template_name='justified in saying', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
Reference in New Issue
Block a user