{ "module": "keras_hub.src.models.d_fine.d_fine_backbone", "class_name": "DFineBackbone", "config": { "name": "d_fine_backbone", "trainable": true, "backbone": { "module": "keras_hub.src.models.hgnetv2.hgnetv2_backbone", "class_name": "HGNetV2Backbone", "config": { "name": "hg_net_v2_backbone", "trainable": true, "depths": [ 3, 4, 6, 3 ], "embedding_size": 32, "hidden_sizes": [ 128, 256, 512, 1024 ], "stem_channels": [ 3, 16, 16 ], "hidden_act": "relu", "use_learnable_affine_block": true, "stackwise_stage_filters": [ [ 16, 16, 64, 1, 3, 3 ], [ 64, 32, 256, 1, 3, 3 ], [ 256, 64, 512, 2, 3, 5 ], [ 512, 128, 1024, 1, 3, 5 ] ], "apply_downsample": [ false, true, true, true ], "use_lightweight_conv_block": [ false, false, true, true ], "image_shape": [ null, null, 3 ], "out_features": [ "stage2", "stage3", "stage4" ], "data_format": "channels_last" }, "registered_name": "keras_hub>HGNetV2Backbone" }, "decoder_in_channels": [ 256, 256, 256 ], "encoder_hidden_dim": 256, "num_labels": 80, "num_denoising": 100, "learn_initial_query": false, "num_queries": 300, "anchor_image_size": [ 640, 640 ], "feat_strides": [ 8, 16, 32 ], "num_feature_levels": 3, "hidden_dim": 256, "encoder_in_channels": [ 256, 512, 1024 ], "encode_proj_layers": [ 2 ], "num_attention_heads": 8, "encoder_ffn_dim": 1024, "num_encoder_layers": 1, "hidden_expansion": 0.5, "depth_multiplier": 0.34, "eval_idx": -1, "box_noise_scale": 1.0, "label_noise_ratio": 0.5, "labels": null, "num_decoder_layers": 3, "decoder_attention_heads": 8, "decoder_ffn_dim": 1024, "decoder_method": "default", "decoder_n_points": [ 3, 6, 3 ], "lqe_hidden_dim": 64, "num_lqe_layers": 2, "seed": 0, "image_shape": [ null, null, 3 ], "data_format": "channels_last", "out_features": [ "stage2", "stage3", "stage4" ] }, "registered_name": "keras_hub>DFineBackbone" }