Safetensors
rt_detr_v2
docling-layout-heron / config.json
nlivathinos's picture
train-DLNv1_DLNv2_WS2013_NoTables (#2)
bdb7099 verified
{
"activation_dropout": 0.0,
"activation_function": "silu",
"anchor_image_size": null,
"architectures": [
"RTDetrV2ForObjectDetection"
],
"attention_dropout": 0.0,
"auxiliary_loss": true,
"backbone": null,
"backbone_config": {
"depths": [
3,
4,
6,
3
],
"downsample_in_bottleneck": false,
"downsample_in_first_stage": false,
"embedding_size": 64,
"hidden_act": "relu",
"hidden_sizes": [
256,
512,
1024,
2048
],
"layer_type": "bottleneck",
"model_type": "rt_detr_resnet",
"num_channels": 3,
"out_features": [
"stage2",
"stage3",
"stage4"
],
"out_indices": [
2,
3,
4
],
"stage_names": [
"stem",
"stage1",
"stage2",
"stage3",
"stage4"
]
},
"backbone_kwargs": null,
"batch_norm_eps": 1e-05,
"box_noise_scale": 1.0,
"d_model": 256,
"decoder_activation_function": "relu",
"decoder_attention_heads": 8,
"decoder_ffn_dim": 1024,
"decoder_in_channels": [
256,
256,
256
],
"decoder_layers": 6,
"decoder_method": "default",
"decoder_n_levels": 3,
"decoder_n_points": 4,
"decoder_offset_scale": 0.5,
"dropout": 0.0,
"encode_proj_layers": [
2
],
"encoder_activation_function": "gelu",
"encoder_attention_heads": 8,
"encoder_ffn_dim": 1024,
"encoder_hidden_dim": 256,
"encoder_in_channels": [
512,
1024,
2048
],
"encoder_layers": 1,
"eos_coefficient": 0.0001,
"eval_size": null,
"feat_strides": [
8,
16,
32
],
"focal_loss_alpha": 0.75,
"focal_loss_gamma": 2.0,
"freeze_backbone_batch_norms": true,
"hidden_expansion": 1.0,
"id2label": {
"0": "Caption",
"1": "Footnote",
"2": "Formula",
"3": "List-item",
"4": "Page-footer",
"5": "Page-header",
"6": "Picture",
"7": "Section-header",
"8": "Table",
"9": "Text",
"10": "Title",
"11": "Document Index",
"12": "Code",
"13": "Checkbox-Selected",
"14": "Checkbox-Unselected",
"15": "Form",
"16": "Key-Value Region"
},
"initializer_bias_prior_prob": null,
"initializer_range": 0.01,
"is_encoder_decoder": true,
"label2id": {
"Caption": 0,
"Checkbox-Selected": 13,
"Checkbox-Unselected": 14,
"Code": 12,
"Document Index": 11,
"Footnote": 1,
"Form": 15,
"Formula": 2,
"Key-Value Region": 16,
"List-item": 3,
"Page-footer": 4,
"Page-header": 5,
"Picture": 6,
"Section-header": 7,
"Table": 8,
"Text": 9,
"Title": 10
},
"label_noise_ratio": 0.5,
"layer_norm_eps": 1e-05,
"learn_initial_query": false,
"matcher_alpha": 0.25,
"matcher_bbox_cost": 5.0,
"matcher_class_cost": 2.0,
"matcher_gamma": 2.0,
"matcher_giou_cost": 2.0,
"model_type": "rt_detr_v2",
"normalize_before": false,
"num_denoising": 100,
"num_feature_levels": 3,
"num_queries": 300,
"positional_encoding_temperature": 10000,
"torch_dtype": "float32",
"transformers_version": "4.53.0.dev0",
"use_focal_loss": true,
"use_pretrained_backbone": false,
"use_timm_backbone": false,
"weight_loss_bbox": 5.0,
"weight_loss_giou": 2.0,
"weight_loss_vfl": 1.0,
"with_box_refine": true
}