InterpBench / benchmark_metadata_croissant.json
cybershiptrooper's picture
Update metadata (#5)
c0a69c0 verified
raw
history blame
No virus
40.2 kB
{
"@context": {
"@language": "en",
"@vocab": "https://schema.org/",
"citeAs": "cr:citeAs",
"column": "cr:column",
"conformsTo": "dct:conformsTo",
"cr": "http://mlcommons.org/croissant/",
"rai": "http://mlcommons.org/croissant/RAI/",
"data": {
"@id": "cr:data",
"@type": "@json"
},
"dataType": {
"@id": "cr:dataType",
"@type": "@vocab"
},
"dct": "http://purl.org/dc/terms/",
"examples": {
"@id": "cr:examples",
"@type": "@json"
},
"extract": "cr:extract",
"field": "cr:field",
"fileProperty": "cr:fileProperty",
"fileObject": "cr:fileObject",
"fileSet": "cr:fileSet",
"format": "cr:format",
"includes": "cr:includes",
"isLiveDataset": "cr:isLiveDataset",
"jsonPath": "cr:jsonPath",
"key": "cr:key",
"md5": "cr:md5",
"parentField": "cr:parentField",
"path": "cr:path",
"recordSet": "cr:recordSet",
"references": "cr:references",
"regex": "cr:regex",
"repeated": "cr:repeated",
"replace": "cr:replace",
"sc": "https://schema.org/",
"separator": "cr:separator",
"source": "cr:source",
"subField": "cr:subField",
"transform": "cr:transform"
},
"@type": "sc:Dataset",
"name": "InterpBench",
"description": "A benchmark of transformers with known circuits for evaluating mechanistic interpretability techniques.",
"conformsTo": "http://mlcommons.org/croissant/1.0",
"license": "https://creativecommons.org/licenses/by/4.0/",
"url": "https://huggingface.co/cybershiptrooper/InterpBench",
"version": "1.0.0",
"distribution": [
{
"@type": "cr:FileObject",
"@id": "hf-repository",
"name": "hf-repository",
"description": "The Hugging Face git repository.",
"contentUrl": "https://huggingface.co/cybershiptrooper/InterpBench",
"encodingFormat": "git+https",
"sha256": "main"
},
{
"@type": "cr:FileSet",
"@id": "benchmark-cases-parquet",
"name": "benchmark-cases-parquet",
"description": "Parquet file describing all the cases in the benchmark.",
"containedIn": {
"@id": "hf-repository"
},
"encodingFormat": "application/x-parquet",
"includes": "*.parquet"
},
{
"@type": "cr:FileSet",
"@id": "training-args",
"name": "training-args",
"description": "Training arguments.",
"containedIn": {
"@id": "hf-repository"
},
"encodingFormat": "application/json",
"includes": "*/meta_[0-9]*.json"
},
{
"@type": "cr:FileSet",
"@id": "circuits",
"name": "circuits",
"description": "Ground truth circuits (Pickle).",
"containedIn": {
"@id": "hf-repository"
},
"encodingFormat": "application/octet-stream",
"includes": "*/edges.pkl"
},
{
"@type": "cr:FileSet",
"@id": "weights",
"name": "weights",
"description": "Serialized PyTorch state dictionaries (Pickle).",
"containedIn": {
"@id": "hf-repository"
},
"encodingFormat": "application/octet-stream",
"includes": "*/ll_model_[0-9]*.pkl"
},
{
"@type": "cr:FileSet",
"@id": "cfgs",
"name": "cfgs",
"description": "Architecture configs (Pickle).",
"containedIn": {
"@id": "hf-repository"
},
"encodingFormat": "application/octet-stream",
"includes": "*/ll_model_cfg_[0-9]*.pkl"
}
],
"recordSet": [
{
"@type": "cr:RecordSet",
"@id": "cases",
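"name": "cases",
"description": "Metadata records for the benchmark cases, read from the parquet file describing all the cases in the benchmark.",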
"field": [
{
"@type": "cr:Field",
"@id": "case_id",
"name": "case_id",
"description": "Column 'case_id' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "case_id"
}
}
},
{
"@type": "cr:Field",
"@id": "url",
"name": "url",
"description": "Column 'url' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "url"
}
}
},
{
"@type": "cr:Field",
"@id": "task_description",
"name": "task_description",
"description": "Column 'task_description' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "task_description"
}
}
},
{
"@type": "cr:Field",
"@id": "max_seq_len",
"name": "max_seq_len",
"description": "Column 'max_seq_len' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "max_seq_len"
}
}
},
{
"@type": "cr:Field",
"@id": "min_seq_len",
"name": "min_seq_len",
"description": "Column 'min_seq_len' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "min_seq_len"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg_file_url",
"name": "transformer_cfg_file_url",
"description": "Column 'transformer_cfg_file_url' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg_file_url"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args_file_url",
"name": "training_args_file_url",
"description": "Column 'training_args_file_url' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args_file_url"
}
}
},
{
"@type": "cr:Field",
"@id": "weights_file_url",
"name": "weights_file_url",
"description": "Column 'weights_file_url' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "weights_file_url"
}
}
},
{
"@type": "cr:Field",
"@id": "circuit_file_url",
"name": "circuit_file_url",
"description": "Column 'circuit_file_url' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "circuit_file_url"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.atol",
"name": "training_args.atol",
"description": "Column 'training_args.atol' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.atol"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.lr",
"name": "training_args.lr",
"description": "Column 'training_args.lr' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.lr"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.use_single_loss",
"name": "training_args.use_single_loss",
"description": "Column 'training_args.use_single_loss' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.use_single_loss"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.iit_weight",
"name": "training_args.iit_weight",
"description": "Column 'training_args.iit_weight' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.iit_weight"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.behavior_weight",
"name": "training_args.behavior_weight",
"description": "Column 'training_args.behavior_weight' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.behavior_weight"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.strict_weight",
"name": "training_args.strict_weight",
"description": "Column 'training_args.strict_weight' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.strict_weight"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.epochs",
"name": "training_args.epochs",
"description": "Column 'training_args.epochs' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.epochs"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.act_fn",
"name": "training_args.act_fn",
"description": "Column 'training_args.act_fn' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.act_fn"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.clip_grad_norm",
"name": "training_args.clip_grad_norm",
"description": "Column 'training_args.clip_grad_norm' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.clip_grad_norm"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.lr_scheduler",
"name": "training_args.lr_scheduler",
"description": "Column 'training_args.lr_scheduler' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.lr_scheduler"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.n_layers",
"name": "transformer_cfg.n_layers",
"description": "Column 'transformer_cfg.n_layers' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.n_layers"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.d_model",
"name": "transformer_cfg.d_model",
"description": "Column 'transformer_cfg.d_model' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.d_model"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.n_ctx",
"name": "transformer_cfg.n_ctx",
"description": "Column 'transformer_cfg.n_ctx' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.n_ctx"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.d_head",
"name": "transformer_cfg.d_head",
"description": "Column 'transformer_cfg.d_head' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.d_head"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.model_name",
"name": "transformer_cfg.model_name",
"description": "Column 'transformer_cfg.model_name' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.model_name"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.n_heads",
"name": "transformer_cfg.n_heads",
"description": "Column 'transformer_cfg.n_heads' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.n_heads"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.d_mlp",
"name": "transformer_cfg.d_mlp",
"description": "Column 'transformer_cfg.d_mlp' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.d_mlp"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.act_fn",
"name": "transformer_cfg.act_fn",
"description": "Column 'transformer_cfg.act_fn' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.act_fn"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.d_vocab",
"name": "transformer_cfg.d_vocab",
"description": "Column 'transformer_cfg.d_vocab' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.d_vocab"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.eps",
"name": "transformer_cfg.eps",
"description": "Column 'transformer_cfg.eps' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.eps"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.use_attn_result",
"name": "transformer_cfg.use_attn_result",
"description": "Column 'transformer_cfg.use_attn_result' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.use_attn_result"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.use_attn_scale",
"name": "transformer_cfg.use_attn_scale",
"description": "Column 'transformer_cfg.use_attn_scale' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.use_attn_scale"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.use_split_qkv_input",
"name": "transformer_cfg.use_split_qkv_input",
"description": "Column 'transformer_cfg.use_split_qkv_input' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.use_split_qkv_input"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.use_hook_mlp_in",
"name": "transformer_cfg.use_hook_mlp_in",
"description": "Column 'transformer_cfg.use_hook_mlp_in' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.use_hook_mlp_in"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.use_attn_in",
"name": "transformer_cfg.use_attn_in",
"description": "Column 'transformer_cfg.use_attn_in' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.use_attn_in"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.use_local_attn",
"name": "transformer_cfg.use_local_attn",
"description": "Column 'transformer_cfg.use_local_attn' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.use_local_attn"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.original_architecture",
"name": "transformer_cfg.original_architecture",
"description": "Column 'transformer_cfg.original_architecture' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.original_architecture"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.from_checkpoint",
"name": "transformer_cfg.from_checkpoint",
"description": "Column 'transformer_cfg.from_checkpoint' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.from_checkpoint"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.tokenizer_name",
"name": "transformer_cfg.tokenizer_name",
"description": "Column 'transformer_cfg.tokenizer_name' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.tokenizer_name"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.init_mode",
"name": "transformer_cfg.init_mode",
"description": "Column 'transformer_cfg.init_mode' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.init_mode"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.normalization_type",
"name": "transformer_cfg.normalization_type",
"description": "Column 'transformer_cfg.normalization_type' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.normalization_type"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.n_devices",
"name": "transformer_cfg.n_devices",
"description": "Column 'transformer_cfg.n_devices' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.n_devices"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.attention_dir",
"name": "transformer_cfg.attention_dir",
"description": "Column 'transformer_cfg.attention_dir' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.attention_dir"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.attn_only",
"name": "transformer_cfg.attn_only",
"description": "Column 'transformer_cfg.attn_only' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.attn_only"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.seed",
"name": "transformer_cfg.seed",
"description": "Column 'transformer_cfg.seed' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.seed"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.initializer_range",
"name": "transformer_cfg.initializer_range",
"description": "Column 'transformer_cfg.initializer_range' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.initializer_range"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.init_weights",
"name": "transformer_cfg.init_weights",
"description": "Column 'transformer_cfg.init_weights' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.init_weights"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.scale_attn_by_inverse_layer_idx",
"name": "transformer_cfg.scale_attn_by_inverse_layer_idx",
"description": "Column 'transformer_cfg.scale_attn_by_inverse_layer_idx' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.scale_attn_by_inverse_layer_idx"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.positional_embedding_type",
"name": "transformer_cfg.positional_embedding_type",
"description": "Column 'transformer_cfg.positional_embedding_type' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.positional_embedding_type"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.final_rms",
"name": "transformer_cfg.final_rms",
"description": "Column 'transformer_cfg.final_rms' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.final_rms"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.d_vocab_out",
"name": "transformer_cfg.d_vocab_out",
"description": "Column 'transformer_cfg.d_vocab_out' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.d_vocab_out"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.parallel_attn_mlp",
"name": "transformer_cfg.parallel_attn_mlp",
"description": "Column 'transformer_cfg.parallel_attn_mlp' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.parallel_attn_mlp"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.n_params",
"name": "transformer_cfg.n_params",
"description": "Column 'transformer_cfg.n_params' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.n_params"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.use_hook_tokens",
"name": "transformer_cfg.use_hook_tokens",
"description": "Column 'transformer_cfg.use_hook_tokens' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.use_hook_tokens"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.gated_mlp",
"name": "transformer_cfg.gated_mlp",
"description": "Column 'transformer_cfg.gated_mlp' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.gated_mlp"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.default_prepend_bos",
"name": "transformer_cfg.default_prepend_bos",
"description": "Column 'transformer_cfg.default_prepend_bos' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.default_prepend_bos"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.dtype",
"name": "transformer_cfg.dtype",
"description": "Column 'transformer_cfg.dtype' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.dtype"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.tokenizer_prepends_bos",
"name": "transformer_cfg.tokenizer_prepends_bos",
"description": "Column 'transformer_cfg.tokenizer_prepends_bos' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.tokenizer_prepends_bos"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.post_embedding_ln",
"name": "transformer_cfg.post_embedding_ln",
"description": "Column 'transformer_cfg.post_embedding_ln' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.post_embedding_ln"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.rotary_base",
"name": "transformer_cfg.rotary_base",
"description": "Column 'transformer_cfg.rotary_base' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Integer",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.rotary_base"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.trust_remote_code",
"name": "transformer_cfg.trust_remote_code",
"description": "Column 'transformer_cfg.trust_remote_code' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.trust_remote_code"
}
}
},
{
"@type": "cr:Field",
"@id": "transformer_cfg.rotary_adjacent_pairs",
"name": "transformer_cfg.rotary_adjacent_pairs",
"description": "Column 'transformer_cfg.rotary_adjacent_pairs' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "transformer_cfg.rotary_adjacent_pairs"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.model_pair",
"name": "training_args.model_pair",
"description": "Column 'training_args.model_pair' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.model_pair"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.next_token",
"name": "training_args.next_token",
"description": "Column 'training_args.next_token' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.next_token"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.non_ioi_thresh",
"name": "training_args.non_ioi_thresh",
"description": "Column 'training_args.non_ioi_thresh' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.non_ioi_thresh"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.use_per_token_check",
"name": "training_args.use_per_token_check",
"description": "Column 'training_args.use_per_token_check' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.use_per_token_check"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.batch_size",
"name": "training_args.batch_size",
"description": "Column 'training_args.batch_size' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.batch_size"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.num_workers",
"name": "training_args.num_workers",
"description": "Column 'training_args.num_workers' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Float",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.num_workers"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.early_stop",
"name": "training_args.early_stop",
"description": "Column 'training_args.early_stop' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Boolean",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.early_stop"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.scheduler_val_metric",
"name": "training_args.scheduler_val_metric",
"description": "Column 'training_args.scheduler_val_metric' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.scheduler_val_metric"
}
}
},
{
"@type": "cr:Field",
"@id": "training_args.scheduler_mode",
"name": "training_args.scheduler_mode",
"description": "Column 'training_args.scheduler_mode' from the parquet file describing all the cases in the benchmark.",
"dataType": "sc:Text",
"source": {
"fileSet": {
"@id": "benchmark-cases-parquet"
},
"extract": {
"column": "training_args.scheduler_mode"
}
}
}
]
}
]
}