RoyRud1902 committed on
Commit
4b09a94
·
verified ·
1 Parent(s): ecd872a

Upload 9 files

Browse files
Files changed (10) hide show
  1. .gitattributes +3 -0
  2. BoxPR_curve.png +0 -0
  3. args.yaml +106 -0
  4. best.pt +3 -0
  5. config.json +39 -0
  6. confusion_matrix.png +3 -0
  7. example_inference.py +55 -0
  8. labels.jpg +3 -0
  9. results.csv +51 -0
  10. results.png +3 -0
.gitattributes CHANGED
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ confusion_matrix.png filter=lfs diff=lfs merge=lfs -text
37
+ labels.jpg filter=lfs diff=lfs merge=lfs -text
38
+ results.png filter=lfs diff=lfs merge=lfs -text
BoxPR_curve.png ADDED
args.yaml ADDED
@@ -0,0 +1,106 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ task: detect
2
+ mode: train
3
+ model: yolo11n.pt
4
+ data: C:\Users\oleks\Projects\yolo-gui-detect\datasets\hf_yolo_text\dataset.yaml
5
+ epochs: 50
6
+ time: null
7
+ patience: 100
8
+ batch: 16
9
+ imgsz: 640
10
+ save: true
11
+ save_period: -1
12
+ cache: false
13
+ device: '0'
14
+ workers: 8
15
+ project: runs
16
+ name: text_boxes12
17
+ exist_ok: false
18
+ pretrained: true
19
+ optimizer: auto
20
+ verbose: true
21
+ seed: 0
22
+ deterministic: true
23
+ single_cls: false
24
+ rect: false
25
+ cos_lr: false
26
+ close_mosaic: 10
27
+ resume: false
28
+ amp: true
29
+ fraction: 1.0
30
+ profile: false
31
+ freeze: null
32
+ multi_scale: false
33
+ compile: false
34
+ overlap_mask: true
35
+ mask_ratio: 4
36
+ dropout: 0.0
37
+ val: true
38
+ split: val
39
+ save_json: false
40
+ conf: null
41
+ iou: 0.7
42
+ max_det: 300
43
+ half: false
44
+ dnn: false
45
+ plots: true
46
+ source: null
47
+ vid_stride: 1
48
+ stream_buffer: false
49
+ visualize: false
50
+ augment: false
51
+ agnostic_nms: false
52
+ classes: null
53
+ retina_masks: false
54
+ embed: null
55
+ show: false
56
+ save_frames: false
57
+ save_txt: false
58
+ save_conf: false
59
+ save_crop: false
60
+ show_labels: true
61
+ show_conf: true
62
+ show_boxes: true
63
+ line_width: null
64
+ format: torchscript
65
+ keras: false
66
+ optimize: false
67
+ int8: false
68
+ dynamic: false
69
+ simplify: true
70
+ opset: null
71
+ workspace: null
72
+ nms: false
73
+ lr0: 0.01
74
+ lrf: 0.01
75
+ momentum: 0.937
76
+ weight_decay: 0.0005
77
+ warmup_epochs: 3.0
78
+ warmup_momentum: 0.8
79
+ warmup_bias_lr: 0.1
80
+ box: 7.5
81
+ cls: 0.5
82
+ dfl: 1.5
83
+ pose: 12.0
84
+ kobj: 1.0
85
+ nbs: 64
86
+ hsv_h: 0.015
87
+ hsv_s: 0.7
88
+ hsv_v: 0.4
89
+ degrees: 0.0
90
+ translate: 0.1
91
+ scale: 0.5
92
+ shear: 0.0
93
+ perspective: 0.0
94
+ flipud: 0.0
95
+ fliplr: 0.5
96
+ bgr: 0.0
97
+ mosaic: 1.0
98
+ mixup: 0.0
99
+ cutmix: 0.0
100
+ copy_paste: 0.0
101
+ copy_paste_mode: flip
102
+ auto_augment: randaugment
103
+ erasing: 0.4
104
+ cfg: null
105
+ tracker: botsort.yaml
106
+ save_dir: C:\Users\oleks\Projects\yolo-gui-detect\text_box_detector\runs\text_boxes12
best.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce26dca363a67fe96c09cc51bed5d09de887239ad5f8a1bd71ee216c2f602a20
3
+ size 5452890
config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name": "YOLO11n Text",
3
+ "model_type": "yolo11",
4
+ "task": "object-detection",
5
+ "library_name": "ultralytics",
6
+ "architectures": ["YOLO11n"],
7
+ "num_classes": 1,
8
+ "class_names": ["text"],
9
+ "input_size": 640,
10
+ "num_parameters": 2590035,
11
+ "num_layers": 181,
12
+ "training": {
13
+ "epochs": 50,
14
+ "batch_size": 16,
15
+ "optimizer": "SGD",
16
+ "learning_rate": 0.01,
17
+ "momentum": 0.937,
18
+ "weight_decay": 0.0005,
19
+ "warmup_epochs": 3.0,
20
+ "amp": true
21
+ },
22
+ "dataset": {
23
+ "name": "DonkeySmall/Yolo-Text-Detection",
24
+ "train_images": 22661,
25
+ "val_images": 2518,
26
+ "total_images": 25179
27
+ },
28
+ "metrics": {
29
+ "precision": 0.957,
30
+ "recall": 0.936,
31
+ "mAP50": 0.976,
32
+ "mAP50-95": 0.818
33
+ },
34
+ "inference": {
35
+ "recommended_conf": 0.25,
36
+ "recommended_iou": 0.7,
37
+ "max_det": 300
38
+ }
39
+ }
confusion_matrix.png ADDED

Git LFS Details

  • SHA256: 52d7d9095610b4c1f19791b35ae7e0bb9a639338ee107098acfdc28b2726dbc8
  • Pointer size: 131 Bytes
  • Size of remote file: 104 kB
example_inference.py ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ Example inference script for YOLO11n Text model.
3
+
4
+ Usage:
5
+ python example_inference.py --image path/to/image.jpg
6
+ python example_inference.py --image path/to/folder/
7
+ """
8
+
9
+ import argparse
10
+ from pathlib import Path
11
+
12
+ from ultralytics import YOLO
13
+
14
+
15
def main():
    """Run text detection on an image or a folder and print every detection.

    Parses the command-line options, loads ``best.pt`` from the directory that
    contains this script, runs prediction on ``--image`` and prints, for each
    result, its path, its original shape and each box with its confidence.
    """
    parser = argparse.ArgumentParser(description="Text Detection Inference")
    parser.add_argument("--image", required=True, help="Image file or folder path")
    parser.add_argument("--conf", type=float, default=0.25, help="Confidence threshold")
    parser.add_argument("--iou", type=float, default=0.7, help="NMS IoU threshold")
    parser.add_argument("--imgsz", type=int, default=640, help="Input image size")
    parser.add_argument("--save", action="store_true", help="Save annotated images")
    parser.add_argument("--show", action="store_true", help="Display results")
    args = parser.parse_args()

    # Load model: weights are resolved next to this file, not from the
    # current working directory.
    model_path = Path(__file__).parent / "best.pt"
    model = YOLO(str(model_path))

    # Run inference. stream=True makes predict() yield one result at a time,
    # so a large folder is not accumulated in memory before anything is
    # printed; the loop below consumes the generator completely.
    results = model.predict(
        source=args.image,
        conf=args.conf,
        iou=args.iou,
        imgsz=args.imgsz,
        save=args.save,
        show=args.show,
        stream=True,
    )

    # Print results
    for result in results:
        print(f"\nImage: {result.path}")
        print(f"Shape: {result.orig_shape}")

        boxes = result.boxes
        if boxes is None or len(boxes) == 0:
            print("No text regions detected")
            continue

        print(f"Detected {len(boxes)} text regions:")
        for index, box in enumerate(boxes, start=1):
            x1, y1, x2, y2 = box.xyxy[0].tolist()
            conf = box.conf[0].item()
            print(f" [{index}] bbox: [{x1:.1f}, {y1:.1f}, {x2:.1f}, {y2:.1f}], conf: {conf:.3f}")
52
+
53
+
54
+ if __name__ == "__main__":
55
+ main()
labels.jpg ADDED

Git LFS Details

  • SHA256: 6a4b35f638d217ff69fbceeef28705ea900c5915ddfff5e4d26fa41bffb6517a
  • Pointer size: 131 Bytes
  • Size of remote file: 114 kB
results.csv ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ epoch,time,train/box_loss,train/cls_loss,train/dfl_loss,metrics/precision(B),metrics/recall(B),metrics/mAP50(B),metrics/mAP50-95(B),val/box_loss,val/cls_loss,val/dfl_loss,lr/pg0,lr/pg1,lr/pg2
2
+ 1,154.093,1.2432,1.23426,1.03086,0.86022,0.82695,0.89058,0.64336,0.92094,0.80819,0.90889,0.00333098,0.00333098,0.00333098
3
+ 2,273.784,1.09391,0.81848,0.94377,0.89725,0.86219,0.92329,0.68476,0.87448,0.68099,0.89064,0.00653236,0.00653236,0.00653236
4
+ 3,387.418,1.07926,0.75591,0.93997,0.90161,0.85934,0.92001,0.67618,0.88285,0.6765,0.90021,0.00960174,0.00960174,0.00960174
5
+ 4,509.311,1.0335,0.70211,0.93485,0.90339,0.86523,0.92962,0.71274,0.81937,0.60264,0.88824,0.009406,0.009406,0.009406
6
+ 5,637.592,0.96942,0.64274,0.92023,0.90704,0.87834,0.93286,0.72119,0.79064,0.56958,0.88459,0.009208,0.009208,0.009208
7
+ 6,765.563,0.92774,0.60917,0.91118,0.92522,0.88832,0.94737,0.74274,0.76671,0.53699,0.87052,0.00901,0.00901,0.00901
8
+ 7,893.736,0.90253,0.58819,0.90554,0.92358,0.89375,0.9509,0.75135,0.74591,0.51681,0.86721,0.008812,0.008812,0.008812
9
+ 8,1021.67,0.87914,0.5709,0.90027,0.92724,0.90226,0.95354,0.7572,0.72941,0.4979,0.86243,0.008614,0.008614,0.008614
10
+ 9,1150.23,0.86648,0.56036,0.89636,0.93368,0.90227,0.95635,0.76262,0.72678,0.48946,0.86017,0.008416,0.008416,0.008416
11
+ 10,1279.48,0.85714,0.55088,0.89375,0.93526,0.90722,0.95918,0.768,0.70915,0.47671,0.85659,0.008218,0.008218,0.008218
12
+ 11,1408.18,0.84386,0.54158,0.89062,0.93339,0.90856,0.95939,0.77142,0.70693,0.46934,0.85429,0.00802,0.00802,0.00802
13
+ 12,1536.38,0.83054,0.53386,0.88762,0.94049,0.91059,0.9627,0.77856,0.69378,0.45941,0.85215,0.007822,0.007822,0.007822
14
+ 13,1665.25,0.82851,0.52797,0.88595,0.93987,0.91479,0.96265,0.78229,0.68491,0.45152,0.84986,0.007624,0.007624,0.007624
15
+ 14,1793.28,0.81664,0.51847,0.88358,0.94245,0.91514,0.96484,0.78467,0.67759,0.44609,0.84821,0.007426,0.007426,0.007426
16
+ 15,1905.26,0.81278,0.51685,0.88222,0.94215,0.91691,0.96526,0.78737,0.67714,0.44264,0.84634,0.007228,0.007228,0.007228
17
+ 16,2016.91,0.8072,0.51053,0.88117,0.94265,0.91882,0.96668,0.78863,0.67236,0.43562,0.84601,0.00703,0.00703,0.00703
18
+ 17,2142.17,0.80111,0.5061,0.87938,0.94511,0.91844,0.96602,0.79173,0.66569,0.42941,0.84451,0.006832,0.006832,0.006832
19
+ 18,2268.49,0.79787,0.50307,0.87866,0.94573,0.91983,0.9677,0.79452,0.6609,0.42684,0.84307,0.006634,0.006634,0.006634
20
+ 19,2394.83,0.79362,0.49963,0.87721,0.9481,0.9212,0.96825,0.79583,0.6605,0.42168,0.8427,0.006436,0.006436,0.006436
21
+ 20,2521.3,0.78738,0.49556,0.8759,0.94787,0.92029,0.96884,0.79463,0.66034,0.42175,0.84153,0.006238,0.006238,0.006238
22
+ 21,2647.71,0.78345,0.49071,0.87408,0.9491,0.92387,0.9701,0.79744,0.65692,0.41688,0.84079,0.00604,0.00604,0.00604
23
+ 22,2774.45,0.78216,0.48843,0.87405,0.94858,0.92568,0.97081,0.80026,0.65316,0.41254,0.83971,0.005842,0.005842,0.005842
24
+ 23,2900.8,0.77318,0.48282,0.8724,0.95027,0.9263,0.97062,0.80097,0.64951,0.41003,0.83846,0.005644,0.005644,0.005644
25
+ 24,3027.78,0.76892,0.48028,0.87104,0.95034,0.92815,0.97179,0.80309,0.64708,0.40639,0.83776,0.005446,0.005446,0.005446
26
+ 25,3151.48,0.76707,0.47686,0.87031,0.95126,0.92725,0.9719,0.80494,0.64343,0.40364,0.83696,0.005248,0.005248,0.005248
27
+ 26,3263.27,0.76325,0.47532,0.86913,0.95111,0.92866,0.97241,0.80477,0.64294,0.40178,0.8363,0.00505,0.00505,0.00505
28
+ 27,3375.44,0.7591,0.46989,0.8677,0.95249,0.92946,0.97297,0.80634,0.64057,0.39869,0.8354,0.004852,0.004852,0.004852
29
+ 28,3502.31,0.75676,0.46995,0.86821,0.9537,0.92844,0.97319,0.80714,0.63859,0.39799,0.83474,0.004654,0.004654,0.004654
30
+ 29,3628.76,0.75311,0.46632,0.86675,0.95205,0.93071,0.9734,0.80756,0.63723,0.39632,0.83414,0.004456,0.004456,0.004456
31
+ 30,3754.91,0.75138,0.46451,0.86665,0.95148,0.93148,0.9731,0.80817,0.63534,0.39486,0.8339,0.004258,0.004258,0.004258
32
+ 31,3880.99,0.74725,0.46125,0.86602,0.95322,0.93186,0.97375,0.80924,0.63411,0.39284,0.83343,0.00406,0.00406,0.00406
33
+ 32,4007.19,0.74221,0.45726,0.864,0.95528,0.93063,0.97414,0.81016,0.63231,0.39047,0.83313,0.003862,0.003862,0.003862
34
+ 33,4133.37,0.74048,0.4549,0.8638,0.95582,0.93099,0.97423,0.81046,0.63138,0.38955,0.83264,0.003664,0.003664,0.003664
35
+ 34,4259.58,0.74076,0.4536,0.86304,0.95571,0.93147,0.97443,0.81134,0.63089,0.3881,0.83263,0.003466,0.003466,0.003466
36
+ 35,4385.74,0.73558,0.45047,0.86155,0.95533,0.93244,0.97474,0.81173,0.63019,0.38677,0.8323,0.003268,0.003268,0.003268
37
+ 36,4512.17,0.73209,0.448,0.86206,0.95476,0.93337,0.97493,0.81227,0.62909,0.38577,0.83178,0.00307,0.00307,0.00307
38
+ 37,4638.18,0.73095,0.44575,0.86158,0.9548,0.934,0.97513,0.8131,0.62784,0.38439,0.83137,0.002872,0.002872,0.002872
39
+ 38,4764.77,0.72744,0.44342,0.85946,0.95524,0.93449,0.97522,0.81386,0.62676,0.38326,0.83076,0.002674,0.002674,0.002674
40
+ 39,4891.29,0.72515,0.44117,0.85999,0.95593,0.93421,0.97529,0.81424,0.62599,0.38245,0.83051,0.002476,0.002476,0.002476
41
+ 40,5018.86,0.71995,0.43761,0.85823,0.95614,0.93474,0.97555,0.81486,0.62493,0.38155,0.83013,0.002278,0.002278,0.002278
42
+ 41,5166.44,0.68209,0.42159,0.84599,0.95489,0.93566,0.9755,0.81513,0.62405,0.38098,0.82988,0.00208,0.00208,0.00208
43
+ 42,5289.42,0.67706,0.41656,0.84451,0.95466,0.93632,0.97563,0.81566,0.62297,0.38008,0.8296,0.001882,0.001882,0.001882
44
+ 43,5412.28,0.67274,0.41285,0.84379,0.9556,0.93589,0.97574,0.816,0.62218,0.37928,0.82938,0.001684,0.001684,0.001684
45
+ 44,5534.82,0.66862,0.40797,0.84317,0.95703,0.93508,0.97592,0.81639,0.62156,0.37856,0.82924,0.001486,0.001486,0.001486
46
+ 45,5657.32,0.66297,0.40462,0.84211,0.95747,0.93487,0.97593,0.81667,0.62095,0.37812,0.82899,0.001288,0.001288,0.001288
47
+ 46,5779.71,0.65899,0.40042,0.84059,0.95768,0.93504,0.97605,0.81714,0.62027,0.37755,0.82878,0.00109,0.00109,0.00109
48
+ 47,5902.23,0.65664,0.39733,0.83976,0.95692,0.93581,0.97608,0.81733,0.61986,0.37717,0.8286,0.000892,0.000892,0.000892
49
+ 48,6024.16,0.65297,0.39491,0.8391,0.9567,0.93624,0.97611,0.81773,0.61939,0.37666,0.82847,0.000694,0.000694,0.000694
50
+ 49,6145.84,0.64891,0.39072,0.83855,0.957,0.93597,0.97618,0.81808,0.61896,0.37637,0.82832,0.000496,0.000496,0.000496
51
+ 50,6267.38,0.64526,0.38754,0.83837,0.95733,0.93614,0.97629,0.81822,0.61867,0.37596,0.82813,0.000298,0.000298,0.000298
results.png ADDED

Git LFS Details

  • SHA256: 0e5275b9387a471a41eb557819f898c1ae45e86dea63ef26148e503cc118bb4d
  • Pointer size: 131 Bytes
  • Size of remote file: 247 kB