初始化项目,由ModelHub XC社区提供模型

Model: bigscience/bloomz-7b1-p3
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-06-15 07:40:14 +08:00
commit 78a6661ff1
634 changed files with 7477 additions and 0 deletions

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "Muennighoff/xstory_cloze",
"dataset_config_name": "zh",
"template_name": "Answer Given options_zhht",
"evaluation": {
"accuracy": 0.7054930509596293
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='Answer Given options_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "Muennighoff/xstory_cloze",
"dataset_config_name": "zh",
"template_name": "Choose Story Ending_zhht",
"evaluation": {
"accuracy": 0.7948378557246857
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='Choose Story Ending_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "Muennighoff/xstory_cloze",
"dataset_config_name": "zh",
"template_name": "Generate Ending_zhht",
"evaluation": {
"accuracy": 0.6366644606221046
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='Generate Ending_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "Muennighoff/xstory_cloze",
"dataset_config_name": "zh",
"template_name": "Novel Correct Ending_zhht",
"evaluation": {
"accuracy": 0.7782925215089345
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='Novel Correct Ending_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "Muennighoff/xstory_cloze",
"dataset_config_name": "zh",
"template_name": "Story Continuation and Options_zhht",
"evaluation": {
"accuracy": 0.771012574454004
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xstory_cloze', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='Story Continuation and Options_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "Muennighoff/xwinograd",
"dataset_config_name": "zh",
"template_name": "Replace_zhht",
"evaluation": {
"accuracy": 0.5178571428571429
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='test', target_max_length=256, template_config_name='zh', template_name='Replace_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "Muennighoff/xwinograd",
"dataset_config_name": "zh",
"template_name": "True or False_zhht",
"evaluation": {
"accuracy": 0.5218253968253969
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='test', target_max_length=256, template_config_name='zh', template_name='True or False_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "Muennighoff/xwinograd",
"dataset_config_name": "zh",
"template_name": "does underscore refer to_zhht",
"evaluation": {
"accuracy": 0.4662698412698413
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='test', target_max_length=256, template_config_name='zh', template_name='does underscore refer to_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "Muennighoff/xwinograd",
"dataset_config_name": "zh",
"template_name": "stand for_zhht",
"evaluation": {
"accuracy": 0.49404761904761907
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='test', target_max_length=256, template_config_name='zh', template_name='stand for_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "Muennighoff/xwinograd",
"dataset_config_name": "zh",
"template_name": "underscore refer to_zhht",
"evaluation": {
"accuracy": 0.44047619047619047
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='Muennighoff/xwinograd', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='test', target_max_length=256, template_config_name='zh', template_name='underscore refer to_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,20 @@
dataset,prompt,metric,value
xcopa_zh,C1 or C2? premise_zhht,accuracy,0.55
xcopa_zh,best_option_zhht,accuracy,0.67
xcopa_zh,cause_effect_zhht,accuracy,0.79
xcopa_zh,i_am_hesitating_zhht,accuracy,0.77
xcopa_zh,plausible_alternatives_zhht,accuracy,0.75
xcopa_zh,median,accuracy,0.75
xstory_cloze_zh,Answer Given options_zhht,accuracy,0.7054930509596293
xstory_cloze_zh,Choose Story Ending_zhht,accuracy,0.7948378557246857
xstory_cloze_zh,Generate Ending_zhht,accuracy,0.6366644606221046
xstory_cloze_zh,Novel Correct Ending_zhht,accuracy,0.7782925215089345
xstory_cloze_zh,Story Continuation and Options_zhht,accuracy,0.771012574454004
xstory_cloze_zh,median,accuracy,0.771012574454004
xwinograd_zh,Replace_zhht,accuracy,0.5178571428571429
xwinograd_zh,True or False_zhht,accuracy,0.5218253968253969
xwinograd_zh,does underscore refer to_zhht,accuracy,0.4662698412698413
xwinograd_zh,stand for_zhht,accuracy,0.49404761904761907
xwinograd_zh,underscore refer to_zhht,accuracy,0.44047619047619047
xwinograd_zh,median,accuracy,0.49404761904761907
multiple,average,multiple,0.6716867311672077
1 dataset prompt metric value
2 xcopa_zh C1 or C2? premise_zhht accuracy 0.55
3 xcopa_zh best_option_zhht accuracy 0.67
4 xcopa_zh cause_effect_zhht accuracy 0.79
5 xcopa_zh i_am_hesitating_zhht accuracy 0.77
6 xcopa_zh plausible_alternatives_zhht accuracy 0.75
7 xcopa_zh median accuracy 0.75
8 xstory_cloze_zh Answer Given options_zhht accuracy 0.7054930509596293
9 xstory_cloze_zh Choose Story Ending_zhht accuracy 0.7948378557246857
10 xstory_cloze_zh Generate Ending_zhht accuracy 0.6366644606221046
11 xstory_cloze_zh Novel Correct Ending_zhht accuracy 0.7782925215089345
12 xstory_cloze_zh Story Continuation and Options_zhht accuracy 0.771012574454004
13 xstory_cloze_zh median accuracy 0.771012574454004
14 xwinograd_zh Replace_zhht accuracy 0.5178571428571429
15 xwinograd_zh True or False_zhht accuracy 0.5218253968253969
16 xwinograd_zh does underscore refer to_zhht accuracy 0.4662698412698413
17 xwinograd_zh stand for_zhht accuracy 0.49404761904761907
18 xwinograd_zh underscore refer to_zhht accuracy 0.44047619047619047
19 xwinograd_zh median accuracy 0.49404761904761907
20 multiple average multiple 0.6716867311672077

File diff suppressed because one or more lines are too long

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "xcopa",
"dataset_config_name": "zh",
"template_name": "C1 or C2? premise_zhht",
"evaluation": {
"accuracy": 0.55
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='C1 or C2? premise_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "xcopa",
"dataset_config_name": "zh",
"template_name": "best_option_zhht",
"evaluation": {
"accuracy": 0.67
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='best_option_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "xcopa",
"dataset_config_name": "zh",
"template_name": "cause_effect_zhht",
"evaluation": {
"accuracy": 0.79
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='cause_effect_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "xcopa",
"dataset_config_name": "zh",
"template_name": "i_am_hesitating_zhht",
"evaluation": {
"accuracy": 0.77
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='i_am_hesitating_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}

View File

@@ -0,0 +1,9 @@
{
"dataset_name": "xcopa",
"dataset_config_name": "zh",
"template_name": "plausible_alternatives_zhht",
"evaluation": {
"accuracy": 0.75
},
"arguments": "Namespace(config_name=None, dataset_config_name='zh', dataset_name='xcopa', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name='zh', template_name='plausible_alternatives_zhht', tokenizer_name=None, use_slow_tokenizer=False)"
}