()
| 31 | |
| 32 | |
| 33 | def get_args_parser(): |
| 34 | parser = argparse.ArgumentParser('Deformable DETR Detector', add_help=False) |
| 35 | parser.add_argument('--lr', default=2e-4, type=float) |
| 36 | parser.add_argument('--lr_backbone_names', default=["backbone.0"], type=str, nargs='+') |
| 37 | parser.add_argument('--lr_backbone', default=2e-5, type=float) |
| 38 | parser.add_argument('--lr_linear_proj_names', default=['reference_points', 'sampling_offsets'], type=str, nargs='+') |
| 39 | parser.add_argument('--lr_linear_proj_mult', default=0.1, type=float) |
| 40 | parser.add_argument('--batch_size', default=1, type=int) |
| 41 | parser.add_argument('--weight_decay', default=1e-4, type=float) |
| 42 | parser.add_argument('--epochs', default=50, type=int) |
| 43 | parser.add_argument('--lr_drop', default=40, type=int) |
| 44 | parser.add_argument('--lr_drop_epochs', default=None, type=int, nargs='+') |
| 45 | parser.add_argument('--clip_max_norm', default=0.1, type=float, |
| 46 | help='gradient clipping max norm') |
| 47 | |
| 48 | parser.add_argument('--sgd', action='store_true') |
| 49 | |
| 50 | # Variants of Deformable DETR |
| 51 | parser.add_argument('--with_box_refine', default=True, action='store_true') |
| 52 | parser.add_argument('--two_stage', default=False, action='store_true') |
| 53 | |
| 54 | # Model parameters |
| 55 | parser.add_argument('--frozen_weights', type=str, default=None, |
| 56 | help="Path to the pretrained model. If set, only the mask head will be trained") |
| 57 | |
| 58 | # * Backbone |
| 59 | parser.add_argument('--backbone', default='resnet50', type=str, |
| 60 | help="Name of the convolutional backbone to use") |
| 61 | parser.add_argument('--dilation', action='store_true', |
| 62 | help="If true, we replace stride with dilation in the last convolutional block (DC5)") |
| 63 | parser.add_argument('--position_embedding', default='sine', type=str, choices=('sine', 'learned'), |
| 64 | help="Type of positional embedding to use on top of the image features") |
| 65 | parser.add_argument('--position_embedding_scale', default=2 * np.pi, type=float, |
| 66 | help="position / size * scale") |
| 67 | parser.add_argument('--num_feature_levels', default=4, type=int, help='number of feature levels') |
| 68 | |
| 69 | # * Transformer |
| 70 | parser.add_argument('--enc_layers', default=6, type=int, |
| 71 | help="Number of encoding layers in the transformer") |
| 72 | parser.add_argument('--dec_layers', default=6, type=int, |
| 73 | help="Number of decoding layers in the transformer") |
| 74 | parser.add_argument('--dim_feedforward', default=1024, type=int, |
| 75 | help="Intermediate size of the feedforward layers in the transformer blocks") |
| 76 | parser.add_argument('--hidden_dim', default=256, type=int, |
| 77 | help="Size of the embeddings (dimension of the transformer)") |
| 78 | parser.add_argument('--dropout', default=0.1, type=float, |
| 79 | help="Dropout applied in the transformer") |
| 80 | parser.add_argument('--nheads', default=8, type=int, |
| 81 | help="Number of attention heads inside the transformer's attentions") |
| 82 | parser.add_argument('--num_queries', default=500, type=int, |
| 83 | help="Number of query slots") |
| 84 | parser.add_argument('--dec_n_points', default=4, type=int) |
| 85 | parser.add_argument('--enc_n_points', default=4, type=int) |
| 86 | |
| 87 | # * Segmentation |
| 88 | parser.add_argument('--masks', action='store_true', |
| 89 | help="Train segmentation head if the flag is provided") |
| 90 |
no outgoing calls
no test coverage detected