初始化项目,由ModelHub XC社区提供模型
Model: bigscience/bloomz-7b1-p3 Source: Original Platform
This commit is contained in:
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "Answer Given options_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.7054930509596293
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='Answer Given options_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "Choose Story Ending_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.7948378557246857
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='Choose Story Ending_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "Generate Ending_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.6366644606221046
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='Generate Ending_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "Novel Correct Ending_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.7782925215089345
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='Novel Correct Ending_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xstory_cloze",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "Story Continuation and Options_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.771012574454004
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='Story Continuation and Options_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "Replace_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5178571428571429
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='test', target_max_length=256, template_config_name='zh', template_name='Replace_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "True or False_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5218253968253969
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='test', target_max_length=256, template_config_name='zh', template_name='True or False_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "does underscore refer to_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.4662698412698413
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='test', target_max_length=256, template_config_name='zh', template_name='does underscore refer to_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "stand for_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.49404761904761907
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='test', target_max_length=256, template_config_name='zh', template_name='stand for_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "Muennighoff/xwinograd",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "underscore refer to_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.44047619047619047
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='test', target_max_length=256, template_config_name='zh', template_name='underscore refer to_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,20 @@
|
||||
dataset,prompt,metric,value
|
||||
xcopa_zh,C1 or C2? premise_zhht,accuracy,0.55
|
||||
xcopa_zh,best_option_zhht,accuracy,0.67
|
||||
xcopa_zh,cause_effect_zhht,accuracy,0.79
|
||||
xcopa_zh,i_am_hesitating_zhht,accuracy,0.77
|
||||
xcopa_zh,plausible_alternatives_zhht,accuracy,0.75
|
||||
xcopa_zh,median,accuracy,0.75
|
||||
xstory_cloze_zh,Answer Given options_zhht,accuracy,0.7054930509596293
|
||||
xstory_cloze_zh,Choose Story Ending_zhht,accuracy,0.7948378557246857
|
||||
xstory_cloze_zh,Generate Ending_zhht,accuracy,0.6366644606221046
|
||||
xstory_cloze_zh,Novel Correct Ending_zhht,accuracy,0.7782925215089345
|
||||
xstory_cloze_zh,Story Continuation and Options_zhht,accuracy,0.771012574454004
|
||||
xstory_cloze_zh,median,accuracy,0.771012574454004
|
||||
xwinograd_zh,Replace_zhht,accuracy,0.5178571428571429
|
||||
xwinograd_zh,True or False_zhht,accuracy,0.5218253968253969
|
||||
xwinograd_zh,does underscore refer to_zhht,accuracy,0.4662698412698413
|
||||
xwinograd_zh,stand for_zhht,accuracy,0.49404761904761907
|
||||
xwinograd_zh,underscore refer to_zhht,accuracy,0.44047619047619047
|
||||
xwinograd_zh,median,accuracy,0.49404761904761907
|
||||
multiple,average,multiple,0.6716867311672077
|
||||
|
File diff suppressed because one or more lines are too long
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "C1 or C2? premise_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.55
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='C1 or C2? premise_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "best_option_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.67
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='best_option_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "cause_effect_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.79
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='cause_effect_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "i_am_hesitating_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.77
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='i_am_hesitating_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "xcopa",
|
||||
"dataset_config_name": "zh",
|
||||
"template_name": "plausible_alternatives_zhht",
|
||||
"evaluation": {
|
||||
"accuracy": 0.75
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='plausible_alternatives_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
Reference in New Issue
Block a user