DivyaAnand Sinha committed on
Commit
6d89946
1 Parent(s): e83d3ba

adding model

Browse files
parser_2024-03-12 DELETED
@@ -1 +0,0 @@
1
- Subproject commit 4450ff48a28ca65362470e3b672f6d8e942c6d4e
 
 
parser_2024-03-12/config.yaml ADDED
@@ -0,0 +1,327 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ CUDNN_BENCHMARK: false
2
+ DATALOADER:
3
+ ASPECT_RATIO_GROUPING: true
4
+ FILTER_EMPTY_ANNOTATIONS: true
5
+ NUM_WORKERS: 4
6
+ REPEAT_THRESHOLD: 0.0
7
+ SAMPLER_TRAIN: TrainingSampler
8
+ DATASETS:
9
+ PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000
10
+ PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000
11
+ PROPOSAL_FILES_TEST: []
12
+ PROPOSAL_FILES_TRAIN: []
13
+ TEST:
14
+ - finetune-val
15
+ TRAIN:
16
+ - finetune-train
17
+ GLOBAL:
18
+ HACK: 1.0
19
+ INPUT:
20
+ CROP:
21
+ ENABLED: false
22
+ SIZE:
23
+ - 0.9
24
+ - 0.9
25
+ TYPE: relative_range
26
+ FORMAT: BGR
27
+ MASK_FORMAT: polygon
28
+ MAX_SIZE_TEST: 1333
29
+ MAX_SIZE_TRAIN: 1333
30
+ MIN_SIZE_TEST: 800
31
+ MIN_SIZE_TRAIN:
32
+ - 640
33
+ - 672
34
+ - 704
35
+ - 736
36
+ - 768
37
+ - 800
38
+ MIN_SIZE_TRAIN_SAMPLING: choice
39
+ RANDOM_FLIP: horizontal
40
+ MODEL:
41
+ ANCHOR_GENERATOR:
42
+ ANGLES:
43
+ - - -90
44
+ - 0
45
+ - 90
46
+ ASPECT_RATIOS:
47
+ - - 0.5
48
+ - 1.0
49
+ - 2.0
50
+ NAME: DefaultAnchorGenerator
51
+ OFFSET: 0.0
52
+ SIZES:
53
+ - - 32
54
+ - - 64
55
+ - - 128
56
+ - - 256
57
+ - - 512
58
+ BACKBONE:
59
+ FREEZE_AT: 2
60
+ NAME: build_resnet_fpn_backbone
61
+ DEVICE: cuda
62
+ FPN:
63
+ FUSE_TYPE: sum
64
+ IN_FEATURES:
65
+ - res2
66
+ - res3
67
+ - res4
68
+ - res5
69
+ NORM: ''
70
+ OUT_CHANNELS: 256
71
+ KEYPOINT_ON: false
72
+ LOAD_PROPOSALS: false
73
+ MASK_ON: false
74
+ META_ARCHITECTURE: GeneralizedRCNN
75
+ PANOPTIC_FPN:
76
+ COMBINE:
77
+ ENABLED: true
78
+ INSTANCES_CONFIDENCE_THRESH: 0.5
79
+ OVERLAP_THRESH: 0.5
80
+ STUFF_AREA_LIMIT: 4096
81
+ INSTANCE_LOSS_WEIGHT: 1.0
82
+ PIXEL_MEAN:
83
+ - 103.53
84
+ - 116.28
85
+ - 123.675
86
+ PIXEL_STD:
87
+ - 1.0
88
+ - 1.0
89
+ - 1.0
90
+ PROPOSAL_GENERATOR:
91
+ MIN_SIZE: 0
92
+ NAME: RPN
93
+ RESNETS:
94
+ DEFORM_MODULATED: false
95
+ DEFORM_NUM_GROUPS: 1
96
+ DEFORM_ON_PER_STAGE:
97
+ - false
98
+ - false
99
+ - false
100
+ - false
101
+ DEPTH: 50
102
+ NORM: FrozenBN
103
+ NUM_GROUPS: 1
104
+ OUT_FEATURES:
105
+ - res2
106
+ - res3
107
+ - res4
108
+ - res5
109
+ RES2_OUT_CHANNELS: 256
110
+ RES5_DILATION: 1
111
+ STEM_OUT_CHANNELS: 64
112
+ STRIDE_IN_1X1: true
113
+ WIDTH_PER_GROUP: 64
114
+ RETINANET:
115
+ BBOX_REG_LOSS_TYPE: smooth_l1
116
+ BBOX_REG_WEIGHTS:
117
+ - 1.0
118
+ - 1.0
119
+ - 1.0
120
+ - 1.0
121
+ FOCAL_LOSS_ALPHA: 0.25
122
+ FOCAL_LOSS_GAMMA: 2.0
123
+ IN_FEATURES:
124
+ - p3
125
+ - p4
126
+ - p5
127
+ - p6
128
+ - p7
129
+ IOU_LABELS:
130
+ - 0
131
+ - -1
132
+ - 1
133
+ IOU_THRESHOLDS:
134
+ - 0.4
135
+ - 0.5
136
+ NMS_THRESH_TEST: 0.5
137
+ NORM: ''
138
+ NUM_CLASSES: 80
139
+ NUM_CONVS: 4
140
+ PRIOR_PROB: 0.01
141
+ SCORE_THRESH_TEST: 0.05
142
+ SMOOTH_L1_LOSS_BETA: 0.1
143
+ TOPK_CANDIDATES_TEST: 1000
144
+ ROI_BOX_CASCADE_HEAD:
145
+ BBOX_REG_WEIGHTS:
146
+ - - 10.0
147
+ - 10.0
148
+ - 5.0
149
+ - 5.0
150
+ - - 20.0
151
+ - 20.0
152
+ - 10.0
153
+ - 10.0
154
+ - - 30.0
155
+ - 30.0
156
+ - 15.0
157
+ - 15.0
158
+ IOUS:
159
+ - 0.5
160
+ - 0.6
161
+ - 0.7
162
+ ROI_BOX_HEAD:
163
+ BBOX_REG_LOSS_TYPE: smooth_l1
164
+ BBOX_REG_LOSS_WEIGHT: 1.0
165
+ BBOX_REG_WEIGHTS:
166
+ - 10.0
167
+ - 10.0
168
+ - 5.0
169
+ - 5.0
170
+ CLS_AGNOSTIC_BBOX_REG: false
171
+ CONV_DIM: 256
172
+ FC_DIM: 1024
173
+ NAME: FastRCNNConvFCHead
174
+ NORM: ''
175
+ NUM_CONV: 0
176
+ NUM_FC: 2
177
+ POOLER_RESOLUTION: 7
178
+ POOLER_SAMPLING_RATIO: 0
179
+ POOLER_TYPE: ROIAlignV2
180
+ SMOOTH_L1_BETA: 0.0
181
+ TRAIN_ON_PRED_BOXES: false
182
+ ROI_HEADS:
183
+ BATCH_SIZE_PER_IMAGE: 512
184
+ IN_FEATURES:
185
+ - p2
186
+ - p3
187
+ - p4
188
+ - p5
189
+ IOU_LABELS:
190
+ - 0
191
+ - 1
192
+ IOU_THRESHOLDS:
193
+ - 0.5
194
+ NAME: StandardROIHeads
195
+ NMS_THRESH_TEST: 0.5
196
+ NUM_CLASSES: 11
197
+ POSITIVE_FRACTION: 0.25
198
+ PROPOSAL_APPEND_GT: true
199
+ SCORE_THRESH_TEST: 0.05
200
+ ROI_KEYPOINT_HEAD:
201
+ CONV_DIMS:
202
+ - 512
203
+ - 512
204
+ - 512
205
+ - 512
206
+ - 512
207
+ - 512
208
+ - 512
209
+ - 512
210
+ LOSS_WEIGHT: 1.0
211
+ MIN_KEYPOINTS_PER_IMAGE: 1
212
+ NAME: KRCNNConvDeconvUpsampleHead
213
+ NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true
214
+ NUM_KEYPOINTS: 17
215
+ POOLER_RESOLUTION: 14
216
+ POOLER_SAMPLING_RATIO: 0
217
+ POOLER_TYPE: ROIAlignV2
218
+ ROI_MASK_HEAD:
219
+ CLS_AGNOSTIC_MASK: false
220
+ CONV_DIM: 256
221
+ NAME: MaskRCNNConvUpsampleHead
222
+ NORM: ''
223
+ NUM_CONV: 4
224
+ POOLER_RESOLUTION: 14
225
+ POOLER_SAMPLING_RATIO: 0
226
+ POOLER_TYPE: ROIAlignV2
227
+ RPN:
228
+ BATCH_SIZE_PER_IMAGE: 256
229
+ BBOX_REG_LOSS_TYPE: smooth_l1
230
+ BBOX_REG_LOSS_WEIGHT: 1.0
231
+ BBOX_REG_WEIGHTS:
232
+ - 1.0
233
+ - 1.0
234
+ - 1.0
235
+ - 1.0
236
+ BOUNDARY_THRESH: -1
237
+ CONV_DIMS:
238
+ - -1
239
+ HEAD_NAME: StandardRPNHead
240
+ IN_FEATURES:
241
+ - p2
242
+ - p3
243
+ - p4
244
+ - p5
245
+ - p6
246
+ IOU_LABELS:
247
+ - 0
248
+ - -1
249
+ - 1
250
+ IOU_THRESHOLDS:
251
+ - 0.3
252
+ - 0.7
253
+ LOSS_WEIGHT: 1.0
254
+ NMS_THRESH: 0.7
255
+ POSITIVE_FRACTION: 0.5
256
+ POST_NMS_TOPK_TEST: 1000
257
+ POST_NMS_TOPK_TRAIN: 1000
258
+ PRE_NMS_TOPK_TEST: 1000
259
+ PRE_NMS_TOPK_TRAIN: 2000
260
+ SMOOTH_L1_BETA: 0.0
261
+ SEM_SEG_HEAD:
262
+ COMMON_STRIDE: 4
263
+ CONVS_DIM: 128
264
+ IGNORE_VALUE: 255
265
+ IN_FEATURES:
266
+ - p2
267
+ - p3
268
+ - p4
269
+ - p5
270
+ LOSS_WEIGHT: 1.0
271
+ NAME: SemSegFPNHead
272
+ NORM: GN
273
+ NUM_CLASSES: 54
274
+ WEIGHTS: /home/ubuntu/layout-parser/models/DocLayNet-large_fast_rcnn_R_50_FPN_3x/model_final.pth
275
+ OUTPUT_DIR: ./outputs/finetune/fast_rcnn_R_50_FPN_3x/
276
+ SEED: -1
277
+ SOLVER:
278
+ AMP:
279
+ ENABLED: false
280
+ BASE_LR: 0.00025
281
+ BIAS_LR_FACTOR: 1.0
282
+ CHECKPOINT_PERIOD: 20000
283
+ CLIP_GRADIENTS:
284
+ CLIP_TYPE: value
285
+ CLIP_VALUE: 1.0
286
+ ENABLED: false
287
+ NORM_TYPE: 2.0
288
+ GAMMA: 0.1
289
+ IMS_PER_BATCH: 2
290
+ LR_SCHEDULER_NAME: WarmupMultiStepLR
291
+ MAX_ITER: 60000
292
+ MOMENTUM: 0.9
293
+ NESTEROV: false
294
+ REFERENCE_WORLD_SIZE: 0
295
+ STEPS:
296
+ - 210000
297
+ - 250000
298
+ WARMUP_FACTOR: 0.001
299
+ WARMUP_ITERS: 1000
300
+ WARMUP_METHOD: linear
301
+ WEIGHT_DECAY: 0.0001
302
+ WEIGHT_DECAY_BIAS: 0.0001
303
+ WEIGHT_DECAY_NORM: 0.0
304
+ TEST:
305
+ AUG:
306
+ ENABLED: false
307
+ FLIP: true
308
+ MAX_SIZE: 4000
309
+ MIN_SIZES:
310
+ - 400
311
+ - 500
312
+ - 600
313
+ - 700
314
+ - 800
315
+ - 900
316
+ - 1000
317
+ - 1100
318
+ - 1200
319
+ DETECTIONS_PER_IMAGE: 100
320
+ EVAL_PERIOD: 0
321
+ EXPECTED_RESULTS: []
322
+ KEYPOINT_OKS_SIGMAS: []
323
+ PRECISE_BN:
324
+ ENABLED: false
325
+ NUM_ITER: 200
326
+ VERSION: 2
327
+ VIS_PERIOD: 0
parser_2024-03-12/eval.csv ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ,bbox
2
+ AP,48.744662430853865
3
+ AP50,74.36064012361008
4
+ AP75,53.027459747550274
5
+ APs,0.0
6
+ APm,13.334398325824157
7
+ APl,53.40041646256427
8
+ AP-Caption,45.51980198019802
9
+ AP-Footnote,47.66849132392231
10
+ AP-Formula,
11
+ AP-Page-footer,25.746028461057037
12
+ AP-Page-header,67.44123203400125
13
+ AP-Picture,48.699900371420455
14
+ AP-Section-header,45.18482922396696
15
+ AP-Table,73.22847798677735
16
+ AP-Table-of-contents,52.62376237623763
17
+ AP-Text,55.35390253115556
18
+ AP-Title,25.980198019801975
parser_2024-03-12/events.out.tfevents.1710183741.ip-192-170-5-19.2783.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e90d51c0292ccc6d37f8737680ecd22bdb2ba1b3fcdaa0e8f35f6ed0d6ea19a3
3
+ size 2612801
parser_2024-03-12/inference/coco_instances_results.json ADDED
The diff for this file is too large to render. See raw diff
 
parser_2024-03-12/inference/instances_predictions.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e27b998ce19b78a65f82964714d359f7d6df1f7f298e217c555d3226a9479c77
3
+ size 90720
parser_2024-03-12/last_checkpoint ADDED
@@ -0,0 +1 @@
 
 
1
+ model_final.pth
parser_2024-03-12/log.txt ADDED
The diff for this file is too large to render. See raw diff
 
parser_2024-03-12/metrics.json ADDED
The diff for this file is too large to render. See raw diff
 
parser_2024-03-12/model_0019999.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e66a4eb57effe4ed278b7df33d494d1e9abff92c7161fadbd5b6594a3b6ee60
3
+ size 165917860
parser_2024-03-12/model_0039999.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce2f188e14b18bed144e07742f89313e34679cca31c84b747810e1c0fc396b3e
3
+ size 165917860
parser_2024-03-12/model_0059999.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08fa35a54c5d6aa9e8f49c27843c4e3f2194631449090955625565b13a578717
3
+ size 165917860
parser_2024-03-12/model_final.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08fa35a54c5d6aa9e8f49c27843c4e3f2194631449090955625565b13a578717
3
+ size 165917860