From 24060e4ce7233a97d636857f1cd14128c91d4aab Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Nguy=E1=BB=85n=20Ph=C6=B0=E1=BB=9Bc=20Th=C3=A0nh?=
 <93478665+Zeres-Engel@users.noreply.github.com>
Date: Tue, 5 Aug 2025 19:09:55 +0700
Subject: [PATCH] init

---
 .gitignore                                    |  17 +
 README_ID_Card_Processing.md                  | 183 ++++++++++
 config/config.yaml                            |  48 +++
 data_augmentation.log                         | 222 ++++++++++++
 id_card_processor_main.py                     | 234 ++++++++++++
 main.py                                       | 276 ++++++++++++++
 src/__init__.py                               |  23 ++
 src/__pycache__/__init__.cpython-313.pyc      | Bin 0 -> 589 bytes
 src/__pycache__/__init__.cpython-39.pyc       | Bin 0 -> 559 bytes
 src/__pycache__/config_manager.cpython-39.pyc | Bin 0 -> 6334 bytes
 .../data_augmentation.cpython-39.pyc          | Bin 0 -> 5323 bytes
 .../image_processor.cpython-39.pyc            | Bin 0 -> 5218 bytes
 src/__pycache__/utils.cpython-313.pyc         | Bin 0 -> 5478 bytes
 src/__pycache__/utils.cpython-39.pyc          | Bin 0 -> 3426 bytes
 src/config.py                                 |  40 ++
 src/config_manager.py                         | 175 +++++++++
 src/data_augmentation.py                      | 161 ++++++++
 src/image_processor.py                        | 174 +++++++++
 src/model/__init__.py                         |   8 +
 src/model/__pycache__/__init__.cpython-39.pyc | Bin 0 -> 352 bytes
 .../id_card_processor.cpython-39.pyc          | Bin 0 -> 8960 bytes
 .../__pycache__/yolo_detector.cpython-39.pyc  | Bin 0 -> 7104 bytes
 src/model/id_card_processor.py                | 343 ++++++++++++++++++
 src/model/yolo_detector.py                    | 266 ++++++++++++++
 src/utils.py                                  |  98 +++++
 25 files changed, 2268 insertions(+)
 create mode 100644 .gitignore
 create mode 100644 README_ID_Card_Processing.md
 create mode 100644 config/config.yaml
 create mode 100644 data_augmentation.log
 create mode 100644 id_card_processor_main.py
 create mode 100644 main.py
 create mode 100644 src/__init__.py
 create mode 100644 src/__pycache__/__init__.cpython-313.pyc
 create mode 100644 src/__pycache__/__init__.cpython-39.pyc
 create mode 100644 src/__pycache__/config_manager.cpython-39.pyc
 create mode 100644 src/__pycache__/data_augmentation.cpython-39.pyc
 create mode 100644 src/__pycache__/image_processor.cpython-39.pyc
 create mode 100644 src/__pycache__/utils.cpython-313.pyc
 create mode 100644 src/__pycache__/utils.cpython-39.pyc
 create mode 100644 src/config.py
 create mode 100644 src/config_manager.py
 create mode 100644 src/data_augmentation.py
 create mode 100644 src/image_processor.py
 create mode 100644 src/model/__init__.py
 create mode 100644 src/model/__pycache__/__init__.cpython-39.pyc
 create mode 100644 src/model/__pycache__/id_card_processor.cpython-39.pyc
 create mode 100644 src/model/__pycache__/yolo_detector.cpython-39.pyc
 create mode 100644 src/model/id_card_processor.py
 create mode 100644 src/model/yolo_detector.py
 create mode 100644 src/utils.py

diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..70d391f
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,17 @@
+*.png
+*.json
+*.jpg
+*.zip
+*.rar
+*.pdf
+*.docx
+*.doc
+*.xls
+*.xlsx
+*.ppt
+*.pptx
+*.txt
+*.csv
+*.json
+*.pt
+*.ipynb
diff --git a/README_ID_Card_Processing.md b/README_ID_Card_Processing.md
new file mode 100644
index 0000000..3e922a4
--- /dev/null
+++ b/README_ID_Card_Processing.md
@@ -0,0 +1,183 @@
+# ID Card Processing with YOLO Detection
+
+Hệ thống xử lý ID cards sử dụng YOLO để detect và crop, kết hợp với các phương pháp tiền xử lý để clean background và enhance chất lượng ảnh.
+
+## Tính năng chính
+
+- **YOLO Detection**: Detect và crop ID cards từ ảnh gốc
+- **Background Removal**: 3 phương pháp loại bỏ background (GrabCut, Threshold, Contour)
+- **Image Enhancement**: Cải thiện chất lượng ảnh cho OCR
+- **Batch Processing**: Xử lý hàng loạt ảnh
+- **Flexible Pipeline**: Có thể chạy từng bước riêng biệt
+
+## Cài đặt
+
+1. Cài đặt dependencies:
+```bash
+pip install -r requirements.txt
+```
+
+2. Cấu trúc thư mục:
+```
+OCR/
+├── src/
+│   ├── model/
+│   │   ├── __init__.py
+│   │   ├── yolo_detector.py
+│   │   └── id_card_processor.py
+│   └── ...
+├── data/
+│   ├── IDcards/          # Thư mục chứa ảnh ID cards gốc
+│   └── processed_id_cards/ # Thư mục output
+├── id_card_processor_main.py
+└── requirements.txt
+```
+
+## Sử dụng
+
+### 1. Full Pipeline (Detect + Preprocess)
+
+```bash
+python id_card_processor_main.py \
+    --input-dir "data/IDcards" \
+    --output-dir "data/processed_id_cards" \
+    --confidence 0.5 \
+    --bg-removal grabcut \
+    --target-size 800x600 \
+    --save-annotated
+```
+
+### 2. Chỉ Detect và Crop
+
+```bash
+python id_card_processor_main.py \
+    --input-dir "data/IDcards" \
+    --output-dir "data/processed_id_cards" \
+    --detect-only \
+    --save-annotated
+```
+
+### 3. Chỉ Preprocess (bỏ qua detection)
+
+```bash
+python id_card_processor_main.py \
+    --input-dir "data/IDcards" \
+    --output-dir "data/processed_id_cards" \
+    --preprocess-only \
+    --bg-removal threshold \
+    --target-size 800x600
+```
+
+## Các tham số
+
+### Detection Parameters
+- `--model-path`: Đường dẫn đến custom YOLO model (.pt file)
+- `--confidence`: Ngưỡng confidence cho detection (default: 0.5)
+
+### Preprocessing Parameters
+- `--bg-removal`: Phương pháp loại bỏ background (default: `grabcut`)
+  - `grabcut`: Sử dụng GrabCut algorithm (recommended)
+  - `threshold`: Sử dụng thresholding
+  - `contour`: Sử dụng contour detection
+  - `none`: Không loại bỏ background
+- `--target-size`: Kích thước chuẩn hóa, định dạng `WIDTHxHEIGHT` (ví dụ: `800x600`; default: `800x600`)
+
+### Output Options
+- `--save-annotated`: Lưu ảnh với bounding boxes
+- `--detect-only`: Chỉ chạy detection
+- `--preprocess-only`: Chỉ chạy preprocessing
+
+## Output Structure
+
+```
+data/processed_id_cards/
+├── cropped/           # Ảnh đã được crop từ YOLO
+│   ├── image1_card_1.jpg
+│   ├── image1_card_2.jpg
+│   └── ...
+├── processed/         # Ảnh đã được preprocess
+│   ├── image1_card_1_processed.jpg
+│   ├── image1_card_2_processed.jpg
+│   └── ...
+└── annotated/         # Ảnh với bounding boxes (nếu có)
+    ├── image1_annotated.jpg
+    └── ...
+```
+
+## Ví dụ sử dụng
+
+### Ví dụ 1: Xử lý toàn bộ dataset
+```bash
+# Xử lý tất cả ảnh trong thư mục IDcards
+python id_card_processor_main.py \
+    --input-dir "data/IDcards" \
+    --output-dir "data/processed_id_cards" \
+    --confidence 0.6 \
+    --bg-removal grabcut \
+    --target-size 1024x768 \
+    --save-annotated
+```
+
+### Ví dụ 2: Test với một vài ảnh
+```bash
+# Tạo thư mục test với một vài ảnh
+mkdir -p data/test_images
+# Copy một vài ảnh vào test_images
+
+# Chạy detection
+python id_card_processor_main.py \
+    --input-dir "data/test_images" \
+    --output-dir "data/test_output" \
+    --detect-only \
+    --save-annotated
+```
+
+### Ví dụ 3: Sử dụng custom model
+```bash
+# Nếu bạn có custom YOLO model đã train
+python id_card_processor_main.py \
+    --input-dir "data/IDcards" \
+    --output-dir "data/processed_id_cards" \
+    --model-path "models/custom_id_card_model.pt" \
+    --confidence 0.7
+```
+
+## Lưu ý
+
+1. **YOLO Model**: Mặc định sử dụng YOLOv8n pre-trained. Nếu có custom model tốt hơn, hãy sử dụng `--model-path`
+
+2. **Background Removal**: 
+   - `grabcut`: Tốt nhất cho ID cards có background phức tạp
+   - `threshold`: Nhanh, phù hợp với background đơn giản
+   - `contour`: Phù hợp với ID cards có viền rõ ràng
+
+3. **Performance**: 
+   - Sử dụng GPU nếu có thể để tăng tốc độ detection
+   - Có thể điều chỉnh `--confidence` để cân bằng giữa precision và recall
+
+4. **Memory**: Với dataset lớn, có thể cần tăng memory hoặc xử lý theo batch nhỏ hơn
+
+## Troubleshooting
+
+### Lỗi thường gặp
+
+1. **No detections found**: 
+   - Giảm `--confidence` xuống 0.3-0.4
+   - Kiểm tra chất lượng ảnh input
+
+2. **Memory error**:
+   - Giảm batch size hoặc xử lý từng ảnh một
+   - Sử dụng CPU thay vì GPU
+
+3. **Poor background removal**:
+   - Thử các phương pháp khác nhau: `grabcut`, `threshold`, `contour`
+   - Điều chỉnh parameters trong code
+
+### Debug mode
+
+```bash
+python id_card_processor_main.py \
+    --input-dir "data/IDcards" \
+    --output-dir "data/processed_id_cards" \
+    --log-level DEBUG
+``` 
\ No newline at end of file
diff --git a/config/config.yaml b/config/config.yaml
new file mode 100644
index 0000000..96b942f
--- /dev/null
+++ b/config/config.yaml
@@ -0,0 +1,48 @@
+# Data Augmentation Configuration
+# Main configuration file for image data augmentation
+
+# Paths configuration
+paths:
+  input_dir: "data/Archive"
+  output_dir: "out"
+  log_file: "logs/data_augmentation.log"
+
+# Data augmentation parameters - ONLY ROTATION
+augmentation:
+  # Geometric transformations - ONLY ROTATION
+  rotation:
+    enabled: true
+    angles: [30, 60, 120, 150, 180, 210, 240, 300, 330]  # Specific rotation angles
+    probability: 1.0  # Always apply rotation
+
+# Processing configuration
+processing:
+  target_size: [224, 224]  # [width, height]
+  batch_size: 32
+  num_augmentations: 3  # number of augmented versions per image
+  save_format: "jpg"
+  quality: 95
+
+# Supported image formats
+supported_formats:
+  - ".jpg"
+  - ".jpeg"
+  - ".png"
+  - ".bmp"
+  - ".tiff"
+
+# Logging configuration
+logging:
+  level: "INFO"  # DEBUG, INFO, WARNING, ERROR
+  format: "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
+  handlers:
+    - type: "file"
+      filename: "logs/data_augmentation.log"
+    - type: "console"
+
+# Performance settings
+performance:
+  num_workers: 4
+  prefetch_factor: 2
+  pin_memory: true
+  use_gpu: false 
\ No newline at end of file
diff --git a/data_augmentation.log b/data_augmentation.log
new file mode 100644
index 0000000..2405a6d
--- /dev/null
+++ b/data_augmentation.log
@@ -0,0 +1,222 @@
+2025-08-05 18:53:06,981 - src.model.yolo_detector - INFO - Using pre-trained YOLOv8n model
+2025-08-05 18:53:07,004 - src.model.yolo_detector - INFO - Using device: cuda
+2025-08-05 18:53:07,038 - src.model.yolo_detector - INFO - Using pre-trained YOLOv8n model
+2025-08-05 18:53:07,038 - src.model.yolo_detector - INFO - Using device: cuda
+2025-08-05 18:53:07,361 - src.model.yolo_detector - INFO - Using pre-trained YOLOv8n model
+2025-08-05 18:53:07,362 - src.model.yolo_detector - INFO - Using device: cuda
+2025-08-05 18:53:07,363 - src.model.id_card_processor - INFO - Detecting and cropping ID cards...
+2025-08-05 18:53:07,363 - src.model.yolo_detector - ERROR - No images found in data\IDcards
+2025-08-05 18:53:07,364 - src.model.id_card_processor - INFO - Processing cropped ID cards...
+2025-08-05 18:53:07,364 - src.model.id_card_processor - ERROR - No images found in data\test_output\cropped
+2025-08-05 19:04:14,903 - src.model.yolo_detector - INFO - Using pre-trained YOLOv8n model
+2025-08-05 19:04:14,995 - src.model.yolo_detector - INFO - Using device: cuda
+2025-08-05 19:04:14,996 - src.model.id_card_processor - INFO - Detecting and cropping ID cards...
+2025-08-05 19:04:14,997 - src.model.yolo_detector - INFO - Processing 29 images from data\IDcards and subdirectories
+2025-08-05 19:04:14,998 - src.model.yolo_detector - INFO - Processing 1/29: im10.png
+2025-08-05 19:04:19,785 - src.model.yolo_detector - INFO - Found 1 detections in im10.png
+2025-08-05 19:04:19,813 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im10_card_1.jpg
+2025-08-05 19:04:19,813 - src.model.yolo_detector - INFO - Processed im10.png: 1 cards cropped
+2025-08-05 19:04:19,814 - src.model.yolo_detector - INFO - Processing 2/29: im11.png
+2025-08-05 19:04:19,926 - src.model.yolo_detector - INFO - Found 2 detections in im11.png
+2025-08-05 19:04:19,937 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im11_card_1.jpg
+2025-08-05 19:04:19,946 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im11_card_2.jpg
+2025-08-05 19:04:19,946 - src.model.yolo_detector - INFO - Processed im11.png: 2 cards cropped
+2025-08-05 19:04:19,946 - src.model.yolo_detector - INFO - Processing 3/29: im12.png
+2025-08-05 19:04:20,056 - src.model.yolo_detector - INFO - Found 2 detections in im12.png
+2025-08-05 19:04:20,069 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im12_card_1.jpg
+2025-08-05 19:04:20,082 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im12_card_2.jpg
+2025-08-05 19:04:20,083 - src.model.yolo_detector - INFO - Processed im12.png: 2 cards cropped
+2025-08-05 19:04:20,083 - src.model.yolo_detector - INFO - Processing 4/29: im13.png
+2025-08-05 19:04:20,116 - src.model.yolo_detector - INFO - Found 0 detections in im13.png
+2025-08-05 19:04:20,117 - src.model.yolo_detector - WARNING - No ID cards detected in im13.png
+2025-08-05 19:04:20,117 - src.model.yolo_detector - INFO - Processing 5/29: im14.png
+2025-08-05 19:04:20,156 - src.model.yolo_detector - INFO - Found 1 detections in im14.png
+2025-08-05 19:04:20,172 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im14_card_1.jpg
+2025-08-05 19:04:20,173 - src.model.yolo_detector - INFO - Processed im14.png: 1 cards cropped
+2025-08-05 19:04:20,174 - src.model.yolo_detector - INFO - Processing 6/29: im15.png
+2025-08-05 19:04:20,208 - src.model.yolo_detector - INFO - Found 1 detections in im15.png
+2025-08-05 19:04:20,222 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im15_card_1.jpg
+2025-08-05 19:04:20,222 - src.model.yolo_detector - INFO - Processed im15.png: 1 cards cropped
+2025-08-05 19:04:20,223 - src.model.yolo_detector - INFO - Processing 7/29: im1_.png
+2025-08-05 19:04:20,466 - src.model.yolo_detector - INFO - Found 0 detections in im1_.png
+2025-08-05 19:04:20,466 - src.model.yolo_detector - WARNING - No ID cards detected in im1_.png
+2025-08-05 19:04:20,466 - src.model.yolo_detector - INFO - Processing 8/29: im2.png
+2025-08-05 19:04:20,534 - src.model.yolo_detector - INFO - Found 2 detections in im2.png
+2025-08-05 19:04:20,564 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im2_card_1.jpg
+2025-08-05 19:04:20,594 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im2_card_2.jpg
+2025-08-05 19:04:20,594 - src.model.yolo_detector - INFO - Processed im2.png: 2 cards cropped
+2025-08-05 19:04:20,595 - src.model.yolo_detector - INFO - Processing 9/29: im3.png
+2025-08-05 19:04:20,648 - src.model.yolo_detector - INFO - Found 1 detections in im3.png
+2025-08-05 19:04:20,671 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im3_card_1.jpg
+2025-08-05 19:04:20,671 - src.model.yolo_detector - INFO - Processed im3.png: 1 cards cropped
+2025-08-05 19:04:20,672 - src.model.yolo_detector - INFO - Processing 10/29: im4.png
+2025-08-05 19:04:20,724 - src.model.yolo_detector - INFO - Found 1 detections in im4.png
+2025-08-05 19:04:20,753 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im4_card_1.jpg
+2025-08-05 19:04:20,754 - src.model.yolo_detector - INFO - Processed im4.png: 1 cards cropped
+2025-08-05 19:04:20,754 - src.model.yolo_detector - INFO - Processing 11/29: im5.png
+2025-08-05 19:04:20,798 - src.model.yolo_detector - INFO - Found 2 detections in im5.png
+2025-08-05 19:04:20,816 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im5_card_1.jpg
+2025-08-05 19:04:20,835 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im5_card_2.jpg
+2025-08-05 19:04:20,836 - src.model.yolo_detector - INFO - Processed im5.png: 2 cards cropped
+2025-08-05 19:04:20,837 - src.model.yolo_detector - INFO - Processing 12/29: im6.png
+2025-08-05 19:04:20,994 - src.model.yolo_detector - INFO - Found 2 detections in im6.png
+2025-08-05 19:04:21,052 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im6_card_1.jpg
+2025-08-05 19:04:21,118 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im6_card_2.jpg
+2025-08-05 19:04:21,119 - src.model.yolo_detector - INFO - Processed im6.png: 2 cards cropped
+2025-08-05 19:04:21,120 - src.model.yolo_detector - INFO - Processing 13/29: im7.png
+2025-08-05 19:04:21,159 - src.model.yolo_detector - INFO - Found 3 detections in im7.png
+2025-08-05 19:04:21,168 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im7_card_1.jpg
+2025-08-05 19:04:21,176 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im7_card_2.jpg
+2025-08-05 19:04:21,184 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im7_card_3.jpg
+2025-08-05 19:04:21,184 - src.model.yolo_detector - INFO - Processed im7.png: 3 cards cropped
+2025-08-05 19:04:21,185 - src.model.yolo_detector - INFO - Processing 14/29: im8.png
+2025-08-05 19:04:21,353 - src.model.yolo_detector - INFO - Found 2 detections in im8.png
+2025-08-05 19:04:21,387 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im8_card_1.jpg
+2025-08-05 19:04:21,423 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im8_card_2.jpg
+2025-08-05 19:04:21,424 - src.model.yolo_detector - INFO - Processed im8.png: 2 cards cropped
+2025-08-05 19:04:21,425 - src.model.yolo_detector - INFO - Processing 15/29: im9.png
+2025-08-05 19:04:21,522 - src.model.yolo_detector - INFO - Found 1 detections in im9.png
+2025-08-05 19:04:21,532 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\Archive\im9_card_1.jpg
+2025-08-05 19:04:21,532 - src.model.yolo_detector - INFO - Processed im9.png: 1 cards cropped
+2025-08-05 19:04:21,532 - src.model.yolo_detector - INFO - Processing 16/29: im10.png
+2025-08-05 19:04:21,585 - src.model.yolo_detector - INFO - Found 3 detections in im10.png
+2025-08-05 19:04:21,601 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im10_card_1.jpg
+2025-08-05 19:04:21,618 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im10_card_2.jpg
+2025-08-05 19:04:21,636 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im10_card_3.jpg
+2025-08-05 19:04:21,636 - src.model.yolo_detector - INFO - Processed im10.png: 3 cards cropped
+2025-08-05 19:04:21,638 - src.model.yolo_detector - INFO - Processing 17/29: im11.png
+2025-08-05 19:04:21,679 - src.model.yolo_detector - INFO - Found 2 detections in im11.png
+2025-08-05 19:04:21,696 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im11_card_1.jpg
+2025-08-05 19:04:21,712 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im11_card_2.jpg
+2025-08-05 19:04:21,713 - src.model.yolo_detector - INFO - Processed im11.png: 2 cards cropped
+2025-08-05 19:04:21,713 - src.model.yolo_detector - INFO - Processing 18/29: im12.png
+2025-08-05 19:04:21,755 - src.model.yolo_detector - INFO - Found 0 detections in im12.png
+2025-08-05 19:04:21,756 - src.model.yolo_detector - WARNING - No ID cards detected in im12.png
+2025-08-05 19:04:21,756 - src.model.yolo_detector - INFO - Processing 19/29: im13.png
+2025-08-05 19:04:21,793 - src.model.yolo_detector - INFO - Found 1 detections in im13.png
+2025-08-05 19:04:21,806 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im13_card_1.jpg
+2025-08-05 19:04:21,806 - src.model.yolo_detector - INFO - Processed im13.png: 1 cards cropped
+2025-08-05 19:04:21,806 - src.model.yolo_detector - INFO - Processing 20/29: im14.png
+2025-08-05 19:04:21,846 - src.model.yolo_detector - INFO - Found 2 detections in im14.png
+2025-08-05 19:04:21,862 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im14_card_1.jpg
+2025-08-05 19:04:21,877 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im14_card_2.jpg
+2025-08-05 19:04:21,877 - src.model.yolo_detector - INFO - Processed im14.png: 2 cards cropped
+2025-08-05 19:04:21,878 - src.model.yolo_detector - INFO - Processing 21/29: im15.png
+2025-08-05 19:04:21,914 - src.model.yolo_detector - INFO - Found 0 detections in im15.png
+2025-08-05 19:04:21,914 - src.model.yolo_detector - WARNING - No ID cards detected in im15.png
+2025-08-05 19:04:21,914 - src.model.yolo_detector - INFO - Processing 22/29: im1_.png
+2025-08-05 19:04:21,959 - src.model.yolo_detector - INFO - Found 3 detections in im1_.png
+2025-08-05 19:04:21,971 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im1__card_1.jpg
+2025-08-05 19:04:21,983 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im1__card_2.jpg
+2025-08-05 19:04:21,996 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im1__card_3.jpg
+2025-08-05 19:04:21,997 - src.model.yolo_detector - INFO - Processed im1_.png: 3 cards cropped
+2025-08-05 19:04:21,997 - src.model.yolo_detector - INFO - Processing 23/29: im2.png
+2025-08-05 19:04:22,101 - src.model.yolo_detector - INFO - Found 1 detections in im2.png
+2025-08-05 19:04:22,174 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im2_card_1.jpg
+2025-08-05 19:04:22,174 - src.model.yolo_detector - INFO - Processed im2.png: 1 cards cropped
+2025-08-05 19:04:22,176 - src.model.yolo_detector - INFO - Processing 24/29: im3.png
+2025-08-05 19:04:22,220 - src.model.yolo_detector - INFO - Found 2 detections in im3.png
+2025-08-05 19:04:22,235 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im3_card_1.jpg
+2025-08-05 19:04:22,251 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im3_card_2.jpg
+2025-08-05 19:04:22,252 - src.model.yolo_detector - INFO - Processed im3.png: 2 cards cropped
+2025-08-05 19:04:22,252 - src.model.yolo_detector - INFO - Processing 25/29: im5.png
+2025-08-05 19:04:22,307 - src.model.yolo_detector - INFO - Found 1 detections in im5.png
+2025-08-05 19:04:22,316 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im5_card_1.jpg
+2025-08-05 19:04:22,316 - src.model.yolo_detector - INFO - Processed im5.png: 1 cards cropped
+2025-08-05 19:04:22,317 - src.model.yolo_detector - INFO - Processing 26/29: im6.png
+2025-08-05 19:04:22,375 - src.model.yolo_detector - INFO - Found 2 detections in im6.png
+2025-08-05 19:04:22,387 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im6_card_1.jpg
+2025-08-05 19:04:22,397 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im6_card_2.jpg
+2025-08-05 19:04:22,398 - src.model.yolo_detector - INFO - Processed im6.png: 2 cards cropped
+2025-08-05 19:04:22,399 - src.model.yolo_detector - INFO - Processing 27/29: im7.png
+2025-08-05 19:04:22,441 - src.model.yolo_detector - INFO - Found 1 detections in im7.png
+2025-08-05 19:04:22,458 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im7_card_1.jpg
+2025-08-05 19:04:22,459 - src.model.yolo_detector - INFO - Processed im7.png: 1 cards cropped
+2025-08-05 19:04:22,460 - src.model.yolo_detector - INFO - Processing 28/29: im8.png
+2025-08-05 19:04:22,492 - src.model.yolo_detector - INFO - Found 2 detections in im8.png
+2025-08-05 19:04:22,502 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im8_card_1.jpg
+2025-08-05 19:04:22,509 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im8_card_2.jpg
+2025-08-05 19:04:22,510 - src.model.yolo_detector - INFO - Processed im8.png: 2 cards cropped
+2025-08-05 19:04:22,510 - src.model.yolo_detector - INFO - Processing 29/29: im9.png
+2025-08-05 19:04:22,540 - src.model.yolo_detector - INFO - Found 1 detections in im9.png
+2025-08-05 19:04:22,546 - src.model.yolo_detector - INFO - Saved cropped image to data\processed_id_cards\cropped\titre-sejour-fr\im9_card_1.jpg
+2025-08-05 19:04:22,546 - src.model.yolo_detector - INFO - Processed im9.png: 1 cards cropped
+2025-08-05 19:04:22,546 - src.model.yolo_detector - INFO - Batch processing completed:
+2025-08-05 19:04:22,548 - src.model.yolo_detector - INFO -   - Total images: 29
+2025-08-05 19:04:22,548 - src.model.yolo_detector - INFO -   - Processed: 25
+2025-08-05 19:04:22,548 - src.model.yolo_detector - INFO -   - Total detections: 42
+2025-08-05 19:04:22,549 - src.model.yolo_detector - INFO -   - Total cropped: 42
+2025-08-05 19:04:22,549 - src.model.id_card_processor - INFO - Processing cropped ID cards...
+2025-08-05 19:04:22,552 - src.model.id_card_processor - INFO - Processing 42 images from data\processed_id_cards\cropped and subdirectories
+2025-08-05 19:04:22,552 - src.model.id_card_processor - INFO - Processing 1/42: im10_card_1.jpg
+2025-08-05 19:04:22,564 - src.model.id_card_processor - INFO - Removing background from im10_card_1.jpg
+2025-08-05 19:04:22,877 - src.model.id_card_processor - INFO - Enhancing im10_card_1.jpg
+2025-08-05 19:04:23,016 - src.model.id_card_processor - INFO - Normalizing im10_card_1.jpg
+2025-08-05 19:04:23,023 - src.model.id_card_processor - INFO - Processed im10_card_1.jpg
+2025-08-05 19:04:23,023 - src.model.id_card_processor - INFO - Processing 2/42: im11_card_1.jpg
+2025-08-05 19:04:23,034 - src.model.id_card_processor - INFO - Removing background from im11_card_1.jpg
+2025-08-05 19:04:23,264 - src.model.id_card_processor - INFO - Enhancing im11_card_1.jpg
+2025-08-05 19:04:23,265 - src.model.id_card_processor - INFO - Normalizing im11_card_1.jpg
+2025-08-05 19:04:23,270 - src.model.id_card_processor - INFO - Processed im11_card_1.jpg
+2025-08-05 19:04:23,271 - src.model.id_card_processor - INFO - Processing 3/42: im11_card_2.jpg
+2025-08-05 19:04:23,282 - src.model.id_card_processor - INFO - Removing background from im11_card_2.jpg
+2025-08-05 19:04:23,312 - src.model.id_card_processor - INFO - Enhancing im11_card_2.jpg
+2025-08-05 19:04:23,313 - src.model.id_card_processor - INFO - Normalizing im11_card_2.jpg
+2025-08-05 19:04:23,316 - src.model.id_card_processor - INFO - Processed im11_card_2.jpg
+2025-08-05 19:04:23,316 - src.model.id_card_processor - INFO - Processing 4/42: im12_card_1.jpg
+2025-08-05 19:04:23,328 - src.model.id_card_processor - INFO - Removing background from im12_card_1.jpg
+2025-08-05 19:04:23,670 - src.model.id_card_processor - INFO - Enhancing im12_card_1.jpg
+2025-08-05 19:04:23,671 - src.model.id_card_processor - INFO - Normalizing im12_card_1.jpg
+2025-08-05 19:04:23,675 - src.model.id_card_processor - INFO - Processed im12_card_1.jpg
+2025-08-05 19:04:23,676 - src.model.id_card_processor - INFO - Processing 5/42: im12_card_2.jpg
+2025-08-05 19:04:23,686 - src.model.id_card_processor - INFO - Removing background from im12_card_2.jpg
+2025-08-05 19:04:29,279 - src.model.id_card_processor - INFO - Enhancing im12_card_2.jpg
+2025-08-05 19:04:29,284 - src.model.id_card_processor - INFO - Normalizing im12_card_2.jpg
+2025-08-05 19:04:29,289 - src.model.id_card_processor - INFO - Processed im12_card_2.jpg
+2025-08-05 19:04:29,290 - src.model.id_card_processor - INFO - Processing 6/42: im14_card_1.jpg
+2025-08-05 19:04:29,301 - src.model.id_card_processor - INFO - Removing background from im14_card_1.jpg
+2025-08-05 19:04:29,774 - src.model.id_card_processor - INFO - Enhancing im14_card_1.jpg
+2025-08-05 19:04:29,775 - src.model.id_card_processor - INFO - Normalizing im14_card_1.jpg
+2025-08-05 19:04:29,779 - src.model.id_card_processor - INFO - Processed im14_card_1.jpg
+2025-08-05 19:04:29,780 - src.model.id_card_processor - INFO - Processing 7/42: im15_card_1.jpg
+2025-08-05 19:04:29,791 - src.model.id_card_processor - INFO - Removing background from im15_card_1.jpg
+2025-08-05 19:04:30,009 - src.model.id_card_processor - INFO - Enhancing im15_card_1.jpg
+2025-08-05 19:04:30,010 - src.model.id_card_processor - INFO - Normalizing im15_card_1.jpg
+2025-08-05 19:04:30,015 - src.model.id_card_processor - INFO - Processed im15_card_1.jpg
+2025-08-05 19:04:30,015 - src.model.id_card_processor - INFO - Processing 8/42: im2_card_1.jpg
+2025-08-05 19:04:30,017 - src.model.id_card_processor - INFO - Removing background from im2_card_1.jpg
+2025-08-05 19:04:31,861 - src.model.id_card_processor - INFO - Enhancing im2_card_1.jpg
+2025-08-05 19:04:31,863 - src.model.id_card_processor - INFO - Normalizing im2_card_1.jpg
+2025-08-05 19:04:31,869 - src.model.id_card_processor - INFO - Processed im2_card_1.jpg
+2025-08-05 19:04:31,869 - src.model.id_card_processor - INFO - Processing 9/42: im2_card_2.jpg
+2025-08-05 19:04:31,884 - src.model.id_card_processor - INFO - Removing background from im2_card_2.jpg
+2025-08-05 19:04:38,985 - src.model.id_card_processor - INFO - Enhancing im2_card_2.jpg
+2025-08-05 19:04:38,996 - src.model.id_card_processor - INFO - Normalizing im2_card_2.jpg
+2025-08-05 19:04:39,007 - src.model.id_card_processor - INFO - Processed im2_card_2.jpg
+2025-08-05 19:04:39,008 - src.model.id_card_processor - INFO - Processing 10/42: im3_card_1.jpg
+2025-08-05 19:04:39,009 - src.model.id_card_processor - INFO - Removing background from im3_card_1.jpg
+2025-08-05 19:04:39,177 - src.model.id_card_processor - INFO - Enhancing im3_card_1.jpg
+2025-08-05 19:04:39,178 - src.model.id_card_processor - INFO - Normalizing im3_card_1.jpg
+2025-08-05 19:04:39,182 - src.model.id_card_processor - INFO - Processed im3_card_1.jpg
+2025-08-05 19:04:39,182 - src.model.id_card_processor - INFO - Processing 11/42: im4_card_1.jpg
+2025-08-05 19:04:39,184 - src.model.id_card_processor - INFO - Removing background from im4_card_1.jpg
+2025-08-05 19:04:39,374 - src.model.id_card_processor - INFO - Enhancing im4_card_1.jpg
+2025-08-05 19:04:39,375 - src.model.id_card_processor - INFO - Normalizing im4_card_1.jpg
+2025-08-05 19:04:39,379 - src.model.id_card_processor - INFO - Processed im4_card_1.jpg
+2025-08-05 19:04:39,379 - src.model.id_card_processor - INFO - Processing 12/42: im5_card_1.jpg
+2025-08-05 19:04:39,389 - src.model.id_card_processor - INFO - Removing background from im5_card_1.jpg
+2025-08-05 19:04:39,842 - src.model.id_card_processor - INFO - Enhancing im5_card_1.jpg
+2025-08-05 19:04:39,843 - src.model.id_card_processor - INFO - Normalizing im5_card_1.jpg
+2025-08-05 19:04:39,846 - src.model.id_card_processor - INFO - Processed im5_card_1.jpg
+2025-08-05 19:04:39,846 - src.model.id_card_processor - INFO - Processing 13/42: im5_card_2.jpg
+2025-08-05 19:04:39,859 - src.model.id_card_processor - INFO - Removing background from im5_card_2.jpg
+2025-08-05 19:04:42,430 - src.model.id_card_processor - INFO - Enhancing im5_card_2.jpg
+2025-08-05 19:04:42,434 - src.model.id_card_processor - INFO - Normalizing im5_card_2.jpg
+2025-08-05 19:04:42,438 - src.model.id_card_processor - INFO - Processed im5_card_2.jpg
+2025-08-05 19:04:42,439 - src.model.id_card_processor - INFO - Processing 14/42: im6_card_1.jpg
+2025-08-05 19:04:42,449 - src.model.id_card_processor - INFO - Removing background from im6_card_1.jpg
+2025-08-05 19:04:47,647 - src.model.id_card_processor - INFO - Enhancing im6_card_1.jpg
+2025-08-05 19:04:47,652 - src.model.id_card_processor - INFO - Normalizing im6_card_1.jpg
+2025-08-05 19:04:47,657 - src.model.id_card_processor - INFO - Processed im6_card_1.jpg
+2025-08-05 19:04:47,657 - src.model.id_card_processor - INFO - Processing 15/42: im6_card_2.jpg
+2025-08-05 19:04:47,680 - src.model.id_card_processor - INFO - Removing background from im6_card_2.jpg
diff --git a/id_card_processor_main.py b/id_card_processor_main.py
new file mode 100644
index 0000000..5dabff9
--- /dev/null
+++ b/id_card_processor_main.py
@@ -0,0 +1,234 @@
+"""
+Main script for ID Card Processing with YOLO Detection
+"""
+import argparse
+import sys
+from pathlib import Path
+from typing import Dict, Any
+import logging
+
+# Add src to path for imports
+sys.path.append(str(Path(__file__).parent / "src"))
+
+from src.model.yolo_detector import YOLODetector
+from src.model.id_card_processor import IDCardProcessor
+from src.utils import setup_logging
+
+def parse_arguments() -> argparse.Namespace:
+    """Parse command line arguments; --detect-only and --preprocess-only are mutually exclusive"""
+    parser = argparse.ArgumentParser(description="ID Card Processing with YOLO Detection")
+    
+    parser.add_argument(
+        "--input-dir", 
+        type=str, 
+        required=True,
+        help="Input directory containing ID card images"
+    )
+    
+    parser.add_argument(
+        "--output-dir", 
+        type=str, 
+        default="data/processed_id_cards",
+        help="Output directory for processed images"
+    )
+    
+    parser.add_argument(
+        "--model-path", 
+        type=str, 
+        help="Path to custom YOLO model (.pt file)"
+    )
+    
+    parser.add_argument(
+        "--confidence", 
+        type=float, 
+        default=0.5,
+        help="Confidence threshold for YOLO detection"
+    )
+    mode_group = parser.add_mutually_exclusive_group()  # the two *-only modes contradict each other; argparse rejects both
+    mode_group.add_argument(
+        "--detect-only", 
+        action="store_true",
+        help="Only detect and crop ID cards, skip preprocessing"
+    )
+    
+    mode_group.add_argument(
+        "--preprocess-only", 
+        action="store_true",
+        help="Skip detection, directly preprocess images"
+    )
+    
+    parser.add_argument(
+        "--bg-removal", 
+        type=str, 
+        default="grabcut",
+        choices=["grabcut", "threshold", "contour", "none"],
+        help="Background removal method"
+    )
+    
+    parser.add_argument(
+        "--target-size", 
+        type=str, 
+        default="800x600",
+        help="Target size for normalization (width x height)"
+    )
+    
+    parser.add_argument(
+        "--save-annotated", 
+        action="store_true",
+        help="Save annotated images with bounding boxes"
+    )
+    
+    parser.add_argument(
+        "--log-level", 
+        type=str, 
+        default="INFO",
+        choices=["DEBUG", "INFO", "WARNING", "ERROR"],
+        help="Logging level"
+    )
+    
+    return parser.parse_args()
+
+def parse_size(size_str: str) -> tuple:
+    """Turn a 'WIDTHxHEIGHT' string such as '800x600' into the int tuple (800, 600); print an error and exit(1) if malformed"""
+    try:
+        width, height = [int(part) for part in size_str.split('x')]
+    except ValueError:
+        print(f"Invalid size format: {size_str}. Expected format: widthxheight")
+        sys.exit(1)
+    return (width, height)
+
+def main():
+    """Run detection only, preprocessing only, or the full detect-then-preprocess pipeline, as selected by the CLI flags"""
+    args = parse_arguments()
+    
+    # Setup logging at the level requested on the command line
+    logging_config = {"level": args.log_level}
+    logger = setup_logging(logging_config.get("level", "INFO"))
+    logger.info("Starting ID Card Processing")
+    
+    # Parse paths
+    input_dir = Path(args.input_dir)
+    output_dir = Path(args.output_dir)
+    
+    # Check if input directory exists; abort with exit status 1 otherwise
+    if not input_dir.exists():
+        logger.error(f"Input directory does not exist: {input_dir}")
+        sys.exit(1)
+    
+    # Create output directory (and any missing parents)
+    output_dir.mkdir(parents=True, exist_ok=True)
+    
+    # Parse target size ('WIDTHxHEIGHT' string -> (width, height) tuple)
+    target_size = parse_size(args.target_size)
+    
+    # Initialize YOLO detector (constructed in every mode, including --preprocess-only)
+    logger.info("Initializing YOLO detector...")
+    yolo_detector = YOLODetector(
+        model_path=args.model_path,
+        confidence=args.confidence
+    )
+    
+    # Initialize ID card processor
+    logger.info("Initializing ID card processor...")
+    id_processor = IDCardProcessor(yolo_detector)
+    
+    if args.detect_only:
+        # Only detect and crop ID cards (this branch is tested before --preprocess-only)
+        logger.info("Running YOLO detection only...")
+        results = yolo_detector.batch_process(
+            input_dir, 
+            output_dir / "cropped",
+            save_annotated=args.save_annotated
+        )
+        
+        print("\n" + "="*50)
+        print("YOLO DETECTION RESULTS")
+        print("="*50)
+        print(f"Total images: {results['total_images']}")
+        print(f"Processed images: {results['processed_images']}")
+        print(f"Total detections: {results['total_detections']}")
+        print(f"Total cropped: {results['total_cropped']}")
+        print(f"Output directory: {output_dir / 'cropped'}")
+        print("="*50)
+        
+    elif args.preprocess_only:
+        # Skip detection, directly preprocess the images found in input_dir
+        logger.info("Running preprocessing only...")
+        results = id_processor.batch_process_id_cards(
+            input_dir, 
+            output_dir / "processed",
+            detect_first=False,
+            remove_bg=args.bg_removal != "none",  # NOTE(review): only on/off is passed; the chosen method name is not forwarded
+            enhance=True,
+            normalize=True,
+            target_size=target_size
+        )
+        
+        print("\n" + "="*50)
+        print("PREPROCESSING RESULTS")
+        print("="*50)
+        print(f"Total images: {results['total_images']}")
+        print(f"Processed images: {results['processed_images']}")
+        print(f"Output directory: {output_dir / 'processed'}")
+        print("="*50)
+        
+    else:
+        # Full pipeline: detect + preprocess
+        logger.info("Running full pipeline: detection + preprocessing...")
+        
+        # Step 1: Detect and crop ID cards into <output_dir>/cropped
+        logger.info("Step 1: Detecting and cropping ID cards...")
+        detection_results = yolo_detector.batch_process(
+            input_dir, 
+            output_dir / "cropped",
+            save_annotated=args.save_annotated
+        )
+        
+        # Step 2: Preprocess cropped images. NOTE(review): only the directory's existence is tested, not its contents
+        cropped_dir = output_dir / "cropped"
+        if cropped_dir.exists():
+            logger.info("Step 2: Preprocessing cropped ID cards...")
+            preprocessing_results = id_processor.batch_process_id_cards(
+                cropped_dir, 
+                output_dir / "processed",
+                detect_first=False,
+                remove_bg=args.bg_removal != "none",
+                enhance=True,
+                normalize=True,
+                target_size=target_size
+            )
+        else:
+            logger.warning("No cropped images found, preprocessing original images")
+            preprocessing_results = id_processor.batch_process_id_cards(
+                input_dir, 
+                output_dir / "processed",
+                detect_first=False,
+                remove_bg=args.bg_removal != "none",
+                enhance=True,
+                normalize=True,
+                target_size=target_size
+            )
+        
+        # Print summary of both phases
+        print("\n" + "="*50)
+        print("FULL PIPELINE RESULTS")
+        print("="*50)
+        print("DETECTION PHASE:")
+        print(f"  - Total images: {detection_results['total_images']}")
+        print(f"  - Processed images: {detection_results['processed_images']}")
+        print(f"  - Total detections: {detection_results['total_detections']}")
+        print(f"  - Total cropped: {detection_results['total_cropped']}")
+        print("\nPREPROCESSING PHASE:")
+        print(f"  - Total images: {preprocessing_results['total_images']}")
+        print(f"  - Processed images: {preprocessing_results['processed_images']}")
+        print(f"\nOutput directories:")
+        print(f"  - Cropped images: {output_dir / 'cropped'}")
+        print(f"  - Processed images: {output_dir / 'processed'}")
+        if args.save_annotated:  # NOTE(review): reports the cropped directory for annotated output; confirm where batch_process writes it
+            print(f"  - Annotated images: {output_dir / 'cropped'}")
+        print("="*50)
+    
+    logger.info("ID Card Processing completed successfully")
+
+if __name__ == "__main__":
+    main() 
\ No newline at end of file
diff --git a/main.py b/main.py
new file mode 100644
index 0000000..c544951
--- /dev/null
+++ b/main.py
@@ -0,0 +1,276 @@
+"""
+Main script for data augmentation
+"""
+import argparse
+import sys
+from pathlib import Path
+from typing import Dict, Any
+
+# Add src to path for imports
+sys.path.append(str(Path(__file__).parent / "src"))
+
+from src.config_manager import ConfigManager
+from src.data_augmentation import DataAugmentation
+from src.image_processor import ImageProcessor
+from src.utils import setup_logging, get_image_files, print_progress
+
+def parse_arguments() -> argparse.Namespace:
+    """Parse the augmentation tool's command line; only --config and --log-level define defaults"""
+    parser = argparse.ArgumentParser(description="Image Data Augmentation Tool")
+    
+    parser.add_argument(
+        "--config", 
+        type=str, 
+        default="config/config.yaml",
+        help="Path to configuration file"
+    )
+    
+    parser.add_argument(
+        "--preset", 
+        type=str, 
+        help="Apply augmentation preset (light, medium, heavy, ocr_optimized, document)"
+    )
+    # The next four options have no default, so they are None unless given on the command line
+    parser.add_argument(
+        "--input-dir", 
+        type=str, 
+        help="Input directory containing images (overrides config)"
+    )
+    
+    parser.add_argument(
+        "--output-dir", 
+        type=str, 
+        help="Output directory for augmented images (overrides config)"
+    )
+    
+    parser.add_argument(
+        "--num-augmentations", 
+        type=int, 
+        help="Number of augmented versions per image (overrides config)"
+    )
+    
+    parser.add_argument(
+        "--target-size", 
+        type=str, 
+        help="Target size for images (width x height) (overrides config)"
+    )
+    # Boolean switches (False unless present)
+    parser.add_argument(
+        "--preview", 
+        action="store_true",
+        help="Preview augmentation on first image only"
+    )
+    
+    parser.add_argument(
+        "--info", 
+        action="store_true",
+        help="Show information about images in input directory"
+    )
+    
+
+    
+    parser.add_argument(
+        "--list-presets", 
+        action="store_true",
+        help="List available presets and exit"
+    )
+    
+    parser.add_argument(
+        "--log-level", 
+        type=str, 
+        default="INFO",
+        choices=["DEBUG", "INFO", "WARNING", "ERROR"],
+        help="Logging level"
+    )
+    
+    return parser.parse_args()
+
+def parse_range(range_str: str) -> tuple:
+    """Parse 'min-max' (e.g. '0.8-1.2', or '-0.5-0.5' with a signed minimum) to a float tuple; print an error and exit(1) if malformed"""
+    try:
+        sep = range_str.index('-', 1)  # search from index 1 so a leading minus sign is not mistaken for the separator
+        return (float(range_str[:sep]), float(range_str[sep + 1:]))
+    except ValueError:
+        print(f"Invalid range format: {range_str}. Expected format: min-max")
+        sys.exit(1)
+
+def parse_size(size_str: str) -> tuple:
+    """Turn a 'WIDTHxHEIGHT' string such as '224x224' into the int tuple (224, 224); print an error and exit(1) if malformed"""
+    try:
+        width, height = [int(part) for part in size_str.split('x')]
+    except ValueError:
+        print(f"Invalid size format: {size_str}. Expected format: widthxheight")
+        sys.exit(1)
+    return (width, height)
+
+def show_image_info(input_dir: Path):
+    """Print details for the first 10 images in input_dir, then the total and average file size over all images found"""
+    image_files = get_image_files(input_dir)
+    
+    if not image_files:
+        print(f"No images found in {input_dir}")
+        return
+    
+    print(f"\nFound {len(image_files)} images in {input_dir}")
+    print("\nImage Information:")
+    print("-" * 80)
+    
+    processor = ImageProcessor()
+    # Sum on-disk sizes of every file: the average below divides by len(image_files), so the total must cover them all
+    total_size = sum(path.stat().st_size for path in image_files) / (1024 * 1024)
+    
+    for i, image_path in enumerate(image_files[:10]):  # Show first 10 images
+        info = processor.get_image_info(image_path)
+        if info:
+            print(f"{i+1:2d}. {image_path.name}")
+            print(f"     Size: {info['width']}x{info['height']} pixels")
+            print(f"     Channels: {info['channels']}")
+            print(f"     File size: {info['file_size_mb']} MB")
+            print(f"     Format: {info['format']}")
+    
+    if len(image_files) > 10:
+        print(f"\n... and {len(image_files) - 10} more images")
+    
+    print(f"\nTotal file size: {total_size:.2f} MB")
+    print(f"Average file size: {total_size/len(image_files):.2f} MB")
+
+def preview_augmentation(input_dir: Path, output_dir: Path, config: Dict[str, Any]):
+    """Augment only the first image found in input_dir (3 variants) and print the names of the returned paths"""
+    candidates = get_image_files(input_dir)
+    
+    if not candidates:
+        print(f"No images found in {input_dir}")
+        return
+    
+    sample = candidates[0]
+    print(f"\nPreviewing augmentation on: {sample.name}")
+    
+    # Build the augmenter from the supplied config and run it on the sample only
+    created = DataAugmentation(config).augment_image_file(
+        sample, 
+        output_dir, 
+        num_augmentations=3
+    )
+    
+    # A falsy result is reported as a failure
+    if not created:
+        print("Failed to create augmented images")
+        return
+    
+    print(f"Created {len(created)} augmented versions:")
+    for index, created_path in enumerate(created, start=1):
+        print(f"  {index}. {created_path.name}")
+
+def main():
+    """Load the config, apply preset and CLI overrides, then list presets, show info, preview, or run batch augmentation"""
+    args = parse_arguments()
+    
+    # Initialize config manager from the --config path
+    config_manager = ConfigManager(args.config)
+    
+    # List presets if requested (returns before logging is configured)
+    if args.list_presets:
+        presets = config_manager.list_presets()
+        print("\nAvailable presets:")
+        for preset in presets:
+            print(f"  - {preset}")
+        return
+    
+    # Apply preset if specified; a falsy result from apply_preset aborts with exit status 1
+    if args.preset:
+        if not config_manager.apply_preset(args.preset):
+            sys.exit(1)
+    
+
+    
+    # Override config with command line arguments (applied after the preset)
+    if args.input_dir:
+        config_manager.update_config({"paths": {"input_dir": args.input_dir}})
+    
+    if args.output_dir:
+        config_manager.update_config({"paths": {"output_dir": args.output_dir}})
+    
+    if args.num_augmentations:  # NOTE(review): truthiness test, so an explicit 0 is ignored and the config value is kept
+        config_manager.update_config({"processing": {"num_augmentations": args.num_augmentations}})
+    
+    if args.target_size:
+        target_size = parse_size(args.target_size)
+        config_manager.update_config({"processing": {"target_size": list(target_size)}})
+    
+    # Get configuration sections
+    config = config_manager.get_config()  # NOTE(review): not used again in this function
+    paths_config = config_manager.get_paths_config()
+    processing_config = config_manager.get_processing_config()
+    augmentation_config = config_manager.get_augmentation_config()
+    logging_config = config_manager.get_logging_config()
+    
+    # Setup logging (level comes from the config; args.log_level is not read in this function)
+    logger = setup_logging(logging_config.get("level", "INFO"))
+    logger.info("Starting data augmentation process")
+    
+    # Parse paths, falling back to the built-in defaults when the config has none
+    input_dir = Path(paths_config.get("input_dir", "data/dataset/training_data/images"))
+    output_dir = Path(paths_config.get("output_dir", "data/augmented_data"))
+    
+    # Check if input directory exists
+    if not input_dir.exists():
+        logger.error(f"Input directory does not exist: {input_dir}")
+        sys.exit(1)
+    
+    # Create output directory (done before the --info / --preview early returns below)
+    output_dir.mkdir(parents=True, exist_ok=True)
+    
+    # Show image information if requested
+    if args.info:
+        show_image_info(input_dir)
+        return
+    
+    # Preview augmentation if requested
+    if args.preview:
+        preview_augmentation(input_dir, output_dir, augmentation_config)
+        return
+    
+    # Get image files
+    image_files = get_image_files(input_dir)
+    
+    if not image_files:
+        logger.error(f"No images found in {input_dir}")
+        sys.exit(1)
+    
+    logger.info(f"Found {len(image_files)} images to process")
+    logger.info(f"Output directory: {output_dir}")
+    logger.info(f"Number of augmentations per image: {processing_config.get('num_augmentations', 3)}")
+    logger.info(f"Target size: {processing_config.get('target_size', [224, 224])}")
+    
+    # Create augmentation instance with new config
+    augmenter = DataAugmentation(augmentation_config)
+    
+    # Override the target size on the augmenter's image processor with the configured one
+    target_size = tuple(processing_config.get("target_size", [224, 224]))
+    augmenter.image_processor.target_size = target_size
+    
+    # Perform batch augmentation over input_dir
+    logger.info("Starting batch augmentation...")
+    results = augmenter.batch_augment(
+        input_dir, 
+        output_dir, 
+        num_augmentations=processing_config.get("num_augmentations", 3)
+    )
+    
+    # Get and display summary
+    summary = augmenter.get_augmentation_summary(results)
+    
+    print("\n" + "="*50)
+    print("AUGMENTATION SUMMARY")
+    print("="*50)
+    print(f"Original images: {summary['total_original_images']}")
+    print(f"Augmented images: {summary['total_augmented_images']}")
+    print(f"Augmentation ratio: {summary['augmentation_ratio']:.2f}")
+    print(f"Successful augmentations: {summary['successful_augmentations']}")
+    print(f"Output directory: {output_dir}")
+    print("="*50)
+    
+    logger.info("Data augmentation completed successfully")
+
+if __name__ == "__main__":
+    main() 
\ No newline at end of file
diff --git a/src/__init__.py b/src/__init__.py
new file mode 100644
index 0000000..47078f4
--- /dev/null
+++ b/src/__init__.py
@@ -0,0 +1,23 @@
+"""
+Data Augmentation Package
+"""
+
+__version__ = "1.0.0"
+__author__ = "OCR Data Augmentation Tool"
+# NOTE(review): the star import brings in whatever .utils exposes to `import *`, not only the helpers named in __all__
+from .utils import *
+from .image_processor import ImageProcessor
+from .data_augmentation import DataAugmentation
+from .config_manager import ConfigManager
+# Names exported by `from src import *`: the three classes imported above plus six helper names
+__all__ = [
+    "ImageProcessor",
+    "DataAugmentation",
+    "ConfigManager",
+    "setup_logging",
+    "get_image_files",
+    "load_image",
+    "save_image",
+    "validate_image",
+    "print_progress",
+] 
\ No newline at end of file
diff --git a/src/__pycache__/__init__.cpython-313.pyc b/src/__pycache__/__init__.cpython-313.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..49581cad59e510881d38143517717adc2f997416
GIT binary patch
literal 589
zcmZWlO>5gg5Z#p}%U&b9ff7o4(N!rp>8TJ(p(GS)(>ATzn_yYw&1Q+L6}u}#d`kX7
zFZ~g{_kZ+S7JN!Cy`}XZ=txRGpmP}B3^Q-un{5;k1o7qbhqG&p&~;P%4(}Fhp9A=a
zQlwFeHBLS4rM=Xj_a1vO0u;>sS)hX!_vigtsKXYA^TBMWhcVhm>EI34L<|$Men5_y
zW%09GEO}{}m8y(SSboj~C+pzR^k90hzW@5@ZT$b(JEe;6pb{n6;XO#>7fV<>(JJT0
zC=H!E&DOu%(2I^#c`C(AR>H7OhS~=T9W<#A$wh|Sx}t>=LYBf!1h-T+#Pn1a+&EGw
zw&*&J7`EcKc)VhTTrm5muCy#It+Wyv^t?(&E~Ip!a!TEZ(iPVR%tApZWwkw18gNis
zSr|9z4#I9{rPb(mfStkY-&eJ=-8gR@(Pd|;vjMkQQBe8`ZNU|Cd--AZ-oVkU6!itq
zj=4Fvs><NEnbCPhsVt?XbXr}w!IPz0)CGU4@4;&GVv|6+>0yk2cpmm|257Q-Ir<tU
Zm*g9|yFm{(Xn%u}pFSCRSE1g8>0hcAv;+VE

literal 0
HcmV?d00001

diff --git a/src/__pycache__/__init__.cpython-39.pyc b/src/__pycache__/__init__.cpython-39.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..9f1a7a0866e72a66b9e1b0a522636a7980d2075b
GIT binary patch
literal 559
zcmZWly>8nu5GG|Qwv}3G)^_pg3`V*ZMbRQ&I;0JnbRh&B2$5lkP@+Im2I8m4Gj!|T
z_sGsQQ(vJ|k5+&LC<%VN?{I(L@x`JfcpiS=-#k)69us+aG9;hy`3-^~j0no8$XF&O
zA~%yOf`4K1wqONK_JKKQr);{nr)Jj9*_;wZ#Ox<!rI=rmRk?dxZg}9!&x2}Z7kJRN
zTVC+ymMdBAig)YN_37@-x3lld|HH1VHGgnUvZ9fmAXHykOuKNlk=|Q}p4TbsWo`5=
z&TMzB)j97l*sbPnf+bv@pg@QVFT>D-u}bMq#UmvH=u{Z4wUM5c#&R)wSn2szKH1fl
z8!dQv;<4(T?gI4ADu?rYT^+_LfUpffJOtQE=TR(@5`Yik#yYf%A!y^{(by1kM=ARm
z<1tp}82h}c{n)W;_KKh#C5<w$7dHmr7jef)TY|qQ&HMU?$If-9hC5krq`wWeuW`Y(
jcTEkTI~@Sl{au`WXssBG{FqkkD}+4HX`apKt8}w}gaoG$

literal 0
HcmV?d00001

diff --git a/src/__pycache__/config_manager.cpython-39.pyc b/src/__pycache__/config_manager.cpython-39.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..d6290821750ced85c33b66f8b42a4ec0aff26d81
GIT binary patch
literal 6334
zcmb7INsQda6=jiZ_A-lRU!<{2FEZ4IG*)8AaVD}XMO)-pGmaJ*YD_|Ky4Y=wy2*Bt
zl-xv*a~K6lfCxqa!-r%H%;cs^4nYn+=a^HFBM(8400D#?;<K~9U*z;Q6CvUZe;0o(
ze60WL)&FIWjg=H!e@uS%{yU3`@)vsOzcf6Y#~r*4!Ig@_8CM&u!sM@7QSqxaw5DFs
z8P(~HT+^r+&3q-_EK~~3Vx`EGs|wF?<AK7BZM9P3>P@Abk588_`d-bgN5T$W-!q%G
zXV)EJ)_h@dJG4zZsy7`kl(nVDc)hY(W{Li;9ll@I6aA7~4HNBx*G>v+EgHdYB)Quj
z3RP;`f93FS9(V9MQxr!5c!hvhH2%D!J2}U2@-=l)SyZ^TgHPbO2f0dt8$AC&sT7?O
z>PM)a7f@T|r3ZRtbVxhGN1+`X(vI<QXvc@NNB9J^M~1YMd<xo$A?-Aufp&68JIm*w
zo$6_wX+FQB@&&#K{Y;;}i@m4gM|U)Sj4z?(EPr9}`!UWl80R>D7Beu%P5vBaU|t&R
z#bhkC*Y(s+@u{>BnAHI@Hhi1AUfr}kZr-ySE=&oNkmW|whE@v(tg3zXp)%bU$wVh1
zI!ug)klV~NLU`3S>nIj;6-c$C>}q=oe2u(Fi-VGxUDrG}bn(L2F$aKl8*~d7L_JvP
zK2i5RWGf~)m>K$TNY~41%$nP9x;^5lwEZjT&vM&tHdf2Jpl=Wbh{Q;1l2MDM!%CmZ
zYN7{Dqb8d?Qp6})etD+4vVJ>oM6mAFqqeht$qDX;ertX0;*Iq{RM*q4R<<~nTkv+v
za`CB_Mg0Q<LdnlDLyhMyN<(D!S>A6}h0k{{TF$iK<y3!;LVT~IY%05KPZ5<6le;Mw
zIM*I(A1`gOP}|izY>%ct_nyLaUD1_ojVa#5SCrt~8JL0o?%)m$o}=EsP(D+)8Co2L
z#^~3;aQQtlAx84f>PlE>|C%XVDpTSY(Kg>v_xtv@yo0xHsUN9cDg8a8oPh?WFT_jl
zU~c=Zw9h1Dtb~a#b5U43{l+7f6dbSWlUJ@r$MMa7-ua<PeH}jJyEWlA&FEQb^7Gxl
zfBvzVd6G20>G>hZDf0M=86BlIpZ(OlEClFk-{(_ft(fIv<_6A(ZV(2E?zbE-(aBFL
z#lWsP(k(<0gCx0@aJ?{@w(3r3ai?ZSjWBbVq<Hzmsw26rtcek7&1wmAr01k!3`#);
zUBDg8Kq#upN^FX~%%;={HZK3-qeHII@0BbugcC->8*mhIny#a);(_>{Yg`9;fXnL&
z&;OF~0x#}pF5@L$s;e9%$U%Ah$W9LR6Q~EN@o5ms44(y^&Vi(KzOZA!e2ekoRVOsF
z4<58b{2cNBD<lFZd?gfEh%lZdwQdu;L=aEQhir>*xU7qhHvD=Z`&s>)$1>DqEh)NQ
zE5aPRA}RS%n3XF9)LPPI3c^o!n_K1LV{(+oXGwfW;!_g8A@K(iUqHC0FiGy)5OqA^
z`r<9TCGU9lM#JHWVSDw46I4c8!r!nr+=d&rAO8u>9-Aa+C04Y}R{gPsQaP85gtj0b
z2*6;K(uN&Y-<RcN(u<k{--9s&`<`QAr)=6`lK&tA?S<`fF4mVZV4Q<=>Ud~*BsZEZ
zs6w|^OZ022SJvX!PMoxZYUnnda$ue|Pn`7ZZn5Fqa~gfmO(zI2;pG7Am6Mf;k-qn_
zPM<-XccrXXMhN76U)%+iRgScTQ*-D8YIZgBMWxhoJ*(+7ebKJuqrkE1t*C6k_d&Hm
zGTLvfq=fmZ;;pcFWip6bEnkE%aQf09$-`WA)FmS=M@XetO;^MtCfCUD>X-+@mv9HC
zAQW9?`1_Y`O#DaH4Jy;$KlHqTb))`U&t;l_>VJ!$8(K97SLlHyL(4{TEAcY1A6%WK
zu3n9VKsYn#>SZQbKzswuhkz#~dS6N@mr)(iR4Zz{Fo>$x=l~cpkOVW10)g2@)aELC
zv~#NQ@vB&W{WCv^OneQU9;qowX?V+_80YEr{extHuc7lk;1dS{AJXF~(JvADo~I09
ze;uzE-z0I^#Lg1vUf&Gz^*+ci9E5zJ{Zj&-mw?INhp@i(M644MD|O3Yezy<i@k3zt
zHGN8il9032HH7i&PsBJy7_*KU%G-S?2g9-DgN>gO=QDC9dy9Vv>l;tRIw$9|*Ez#`
zrw{Lohs^4M4xqz))WRm@1mYMv4+ONt?cL4uT|C5dh-qjEGDK5|vMh#Zirqvs6{>CQ
zATkPC3N^0wqM-K>S8<JEABuO<l8k;dEZ<!GyKXpoTf!Ke1@pd(Al7s4Qw$zCy(qcc
z>tGO^ea?zWnHA+zqMZ(tRZvW9w_1&McMJ-hyAL;H5HS>3-x85yx-~N$f}259C2p@p
zjlN-SMKpuGa7s1?#b=+iVy<F`Nyf2(V1vvI7NopMVUL)D$O0tsEmBZ)Hq54DDTJ&$
z?YRL3&`L>V6U<1%q+^4YALxOtePjdiNH#$FB58TD_WnhbOW7vrg7Xj^wyW$ZTUy9M
zHPk4JJgmgoj`ky^CPS<Tqd!r8taP-Fx=lo_$0x4ScV|-=q$VLGgBAxqowSLO!anGg
zgp2S^;|?l>4L%8MDlj7czodNc(z?2(ZRzyxdy04m`GDHdfLPmB<&&P4fKKW=`nGIw
zR{3C}qmxdS2sJ}Kl;~9-`AW_Woo0}fT<qvUXk)idbPf+I=fo9&5LY261Pu`QCfZ#G
zJ*3YfZZC1iX{BaQ%_+lOT2LYG)PAf0`<ZM;EwT8_p#26NX8CNxuiA~^+;VSJByHa&
z3}miE3qm1if}o{fTU;hV4u$g!G67FPtdUwGxrkB=cbbK%1$DU?FFgqZSYsp$Jt_1#
zXd`-kmpLfhjAJCj<5@DS6N7AlLpIe-4FNg)<stH?5IGu!<~)b2?WHX>%xzNUg^Y^M
zFwm;-Fvk=yPH`ZA`~E=wR^X)$+t0wd>{M+33hbmIM_URDe59lGT7aF3TiQn&M>wCB
zBs&#h{n7ZhU0S$_NYy+v_8~qQ$g8`34sui9r1cVX3WBpmFgVcv&r3AK|6(Pg_?AsE
zTYwCbGC9k?o3Q(00(KFT5Ld*jkY%khwV$}v8vcDN2-`?N4cFu7TN$$(q>MZlIjFOm
zavd_z)KB(v))WY4B*H0N9~VO3&xGYt|0zR?F3C0TBB>EG1Zx%o>nm!uQi3FI6vUGI
zPJM$E^o~PWGEFS1@*v>{Xq2Xu;K(U9fpqdUb$p*I7YF^E@MqLGu$|{I2*tv*RD!=k
zq~|$sTAbj}K>>a>`UM$*gmC15^d5wyQkJ>bJraO6FSR(9>uJ#kXF+gyIABLbpHhD<
zv?EeG+OI_)9euRALPWQllf-ut#FyJLLZf4Zd63;F9Rs5wm))bXzFX+z_JHw&PcY_@
zjxK)BCw7Y+eUEu6pWI&(sFPp9r?3R3<74kqVn0aI*#DYM?5pvsr8l4Yif1pbtzNly
z_4bVmx2~<Nnm2D>zkcDyo%pLyJ<^-;<Tc8LO}LFi30ix_6iYBpoL|Ku2a@i1YE5Ry
z11+AR7Gt+$nrc#-ie8jd#fz&^a|1`Wer+J32vC0-_2MOnEAjm0G&3G<6RW4pL|^qi
zXBF-(9ri8iMaj1~N8(Kqlv0SdNqh$a>2(W-Dm>9Qeb+1JQ^uCDv<&_!d#TK3x%fba
zg5wy<Z`0*LAwX|yNoM3>%zliJ8S7KD2}}q@Env4PXazRM=DJeH{xio$)g?84esE13
zHW=-U_+Ox7Jc40aNy)OBK93qy9<?mW=Chi-WpTf1S%S81LCZ)`_@7b$C3W)XNA6y7
z;}VqXiWL%a%H-t9xjaw03lInre7_+s(KD?{L4kmvaHua}lCvUrI9k4ROcjuK6qv3q
zjTXk|o}JUXf5yV(%SVpS3u;*&5mo%8B&7OC)@he(xEm62VuWp+1JwKQ_P&d{ABG?)
WoJ}X^9HrI)?TtF7zQ9J=g8E+oB1upH

literal 0
HcmV?d00001

diff --git a/src/__pycache__/data_augmentation.cpython-39.pyc b/src/__pycache__/data_augmentation.cpython-39.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..8caddd18530dac3dbe49ec4c1fd0766da4a3f644
GIT binary patch
literal 5323
zcmcgw&2QYs73c74ce$%weOdlU>M}KYSfF(q$Ndr%$BJYdP94dR-KHfJu++}%iVC@;
zhg`>6a4(e$^b!=g^w7G1lw0n-w0}X)Jx-53=@y{3qG<cxaF_cb8E$(B?Rm@j<eT??
zzc+8>&COW~JlFpE>HflsqWldjlaB_K+fb5Uf}o0{P(sy!I7I%cjt0M4pofNI5bV<f
zGb}l!u<Vq>ic<+K#|o=XRraYt&8f+GbIu(68bLj5I1Sln2J_*9vk)#ii{X;96fQf<
zM7gKX5-mShX!%HWE>QK6(ya7vTbo|$*<P;`vTo|7e$=&FftMt9JL0w<dL1_1`E7f9
z>%q_Mo$bf#kMD19S*NfQWvfYq{?JSJn}*OI_(>{^$GtdUqP!jBl3pP6O}~{2ZM}O4
zW9#>E;fFkGu_TFjQx{ecdDNBP6IS9qWyAN&EzZ1@xkCjRb=!Wxx?adcJ?4Hlbz>fN
zI4sjbMJAszRBl5_{tSXCU}VKnDFGv2U^+9H*;X$rRC@ttrp9x_DY5cFg;^-6`9hP%
z(w!<@k?l1$hrckR0(};(!i+k-$Qtku`x?+wd!f@gT8Ex_dTH2$Uy{A@YYiANPZwas
zg4Chtnb2tQg-Vy`@^jr;luo)V=Fvy%6E5n%xiRA-dd7=0jzSlit*G1fJ1rFqGJ5bG
z%LbGLFso!FHhm>iTqPw(_zN}zsHpu<EPMFe@A|3l1%98|vzirSikEfXNmh#*u8?c7
zYHvtwdOSxR1$-b>_@RW}6e44fgU3_GlVYK*rpD`_E=M<uhC~ixVTdSI=m`tja>(Zj
zUw}dXc&oL#`;!C~+3j|EhirF~B_E|xyt}=zvzzeNF4}MeG^x||_)wHx*N5%8?mR4!
z=pdAmMf#U#H-3FIuBizl$FbpcJHP>xv$V&%EhPWwL8VP7(&`W3B_jti82kz_xvLJe
zfu8A9y`p3q%C<T%QgW<jMy68jL>rhXInXkanVFtxZ53)d)j!b(rK|+LGWuT>cG`)6
z)ojS*y+ga>KV@B8YF3OXUe5YT?qt=z-;H}|zDO|`T`AXDwdF@JbjZ5xcWugmlx*xS
z99+!Ykp`JTMXo5F`N-BOg0lk!o-f~N635z$IA#3(h%$&aMzZh4OlYmAH^fqhr6Wz=
z_fqaZyRj*(k3Al*x7&V~iTQW8cQ)_rxI1?qKDfWJ{`gL_%+alU8N~$<!rW(mXCLC%
z$39K>fiVyj8Fv~S%?LYmL%Fb1k`0VXWaVNJ=hyP~JbGP$mIOhnR2Rv-R@dr8|F^02
zzjg*Zld}NWsE=6a_QEMRCLH-Wg`)~I7*HgRVtC2a*ra5jc9emZDF@0i95B9eq9UH)
zUF#@R|BOK0NYzX|BAd#GKOC4DIo3`TKo5>FsClCDU!?l6kr^jsP|lQNGb?3fm{rQO
zW5C!6A<B~*nFd%Z_5W4)bv=%QLwjVZ>2o8EY|l=7WW<b%$J5V5idUfTjDc3|tzNjt
zxE-}eUuV>Q3X})eB{t}gA1B2pUkyt<&8C-=N{x|yioABpqg@MAav*6|POn18=^Bb>
zD1M9Lk0}0v;!6<zw+M*$K!_3?YI^~rcL9?K8KD81g~4GpCiGSWp~!>^jY0tBe&n}c
zmpIJy;+S=5voe9?H?U)Vd}QVtPk=a&!2BAHBfe89hDs95VtRSl?dI;wvHd2@mFI<0
zEfXD(J+IbCS*sC?)YO{V|K=HtpSKF0{8BqNhU`IDQ7?r+<5Hh<+(Zs|8FZnBPZdf5
z_y8&?giZiDIZ%%z$SLV5{7Of81V`7ghT##x4s<Y6Ju@WWZ$f}A4a%tjGfPyxsKCrh
zre>7`^EG8)r2zHJI#T(K%shs-A=pg-yXJiWzADhOo*&6Gz_u|%fk;Sg%wufGO?p8(
z#>;s2`EZw(ShX>mLcsbjiM(S=t=iktYBpGnwbE$%00sQd02VR-RWb)XE4hc}pcA~D
z(QE4zYzsLl$Dqa=AVf9wIM4uq*Ju1Dwp19X&LCxA9HAg|Oa(b+-5e3wtmZWM9yWX*
zg@loe?>C_8RHYKq#tDB5TM+y?q@Bjls6~od9X8+=W?8W~!gG#aoU;w<<(!zS6J$kA
z(}5RtVrj^V{<W8KV!Q@0q9T1RNig1m4E>W#z&#f!#IK<u?*d9l20Bpy_vDBS3?Fe1
zDMP9u_J0q-{}0*`1n+_is|6QI)VQeR<EVM0!5SF$%fJgvI4W6%-^?nRiR?HcYs!<G
zux<&)n{wT9zHWvrsd(|ZED3@k6fr^Y#&9hdQM{a!hae5mB%@qp40Z@+sRub)w{srS
zzgnKe5S67bi><u+gu#o^F!2o`nBzVo?st5+HI3{AaUg}nginxXbf^^{;*vc?G>|Z3
zJSBbeZq$Qd)L)!fZHQg|1HesxVHn587VKB8VH*&(zdV|l^jer+w|hZw*ena9m-<1%
zZ^0VEke4x`!QG7i2pV_|1s;AvOH$sna$dfTtz%HjsnrQ(MQIo=B{w<JSTu&p!rf1X
zl360o?RjZyf0QX<5|neWR#Sn4>asddmbJR7le)T0`d80zaB6x}<(sIZq}${@38`0t
zvVrSwfxv?YC<eJV67M<Gj@1)oQ#ry`4QYe9`bRn(Bk=Z`(nT5q0pYGWH5Trgy3C{g
zRJigUOYNi=hIkhmXEOOU>3=v*hC?Ae&yOIx&7;ts+HUd5SHtwtP@(ZXt(e?G=#3sU
zng%7of@aK=59<Sxo9m|vB#tVD)456DM#|Tr|8rHS*S`x0!gFHQxs|mJ>#}Dtzx6v9
z`gbTwf9;G55%NQn<XQUAde_&2sO1I8t?R`yk|yUW{0P=g@TBOV%C!N>2!}BGsrm%`
zGojZ#7&1|nX}`4=K%Ur&!uZxPcK;Ye|Ly-r&te@o2ri^>>j>OYG{{+<h?Tr~Obbb%
zM2t?P+ywGkEiR2YJ7u8+ZW(BNU}q09%BNn?V@XrbS&9sB>eC;08Z%#=HNmBqIpH_3
zT7C<%%49`TiAom9@<02{|JpnfD*zYye+jSTc<Q^Zuv|BcXfMF`n(IF4dBL!!<hnF!
zxh}^elD~@r*~^ze2(=rFQkQz1dxyek!=Ii~ZexcAe^BBGUYTrggtClb{4TyBKqhvL
ze^cP-eLe>Qi`*r~oJ-cq#n-Q1dE*;jmwn9@{sE4=3_=)?z{H3AXZT)1%m@CS{E{%!
zLyZ2p0vK;NX1e(fr1IavIXc`x_hot{|MbD%!7(yrl35UDMS1W=jm}e7l-F{j-9p+X
TxC31)L%vcYuY<(jOX`0B6u*8o

literal 0
HcmV?d00001

diff --git a/src/__pycache__/image_processor.cpython-39.pyc b/src/__pycache__/image_processor.cpython-39.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..93f0a66971a81c47e97ff7ce74af5194986183ff
GIT binary patch
literal 5218
zcmbtY%WoUU8J~SGDT<P9`faP*q%FiIH5?lOQXwep%8n|)kPXFc6ISVB#TiPgEO+VI
zrE4u#y~w8m1&RU%ipBxt+;r`^m!8|dU=D479t!;nxwPLmOAa5R;WS-hXXp8SGr#XS
z4Cd#n1fIu#{@w2F^Mw2h8{>}wjXUtBzl4I47NHu|Bdw*$uii4?YeZ((YFQeNnUURf
zT29w(x!p>uBKxeU+MR37b!)9!cfK{>t+(nLStHb@&T~SYL%p>?^$$tY&2LxNyTK0g
zdOT^fG!5e&uN?(x>U9$CZ3k)C_Ch%!=`kK;VG^g+6WAEpXllZI6lA+iLs*ady@(0-
zVGkz+kuV>GY1TAFHA({NO9G;r22a_bUVj=yAq}!&dtrxV<&fVABbK(2!}w!C;|{#(
zKcHX)z#uK1Y5>MHW-^Oe9sM$)#tVRhTF<SP%^c>k%3c+E?H4+AsQcV(&0)`IKDKD(
zg+Z%y4n}Ko6#HthVxHEaZ+@b0fi6N{9cV8|s%Pj~XfHzBVP}{Fyv_l&20ahGXX*7B
z+%CfSC3+clcy5C76?zrcG^9|LL|w|{Q7Mvy=Wngf6v>#(M$*|h*2G*Ea6~i>bJo@Y
zvEhStd{^O3>rfP0&!$>Id?HyJ`ERP;;8~BuECey-%$wYfnxQIp`A)i`TDX2}11sKR
zxf>66Bh{)@D9)e*^=<iAA<cH*_I6pgvzs*)ou+>BC2Wz;L$Sf<pls^GOj*?7HE0|Y
zz5t)E-f6FF{WN7f-HLbm`)unTOFzw$-qyp_&8?KTw<I@zfK|e8^!A18`yrgp_mOle
z0dn$-lc&5foC8d&0~(<1!saaN^LPSQG+BHltRFxn17Hue^hyRsTWFt=&-FtM3=>Q)
z(+hxm&p6Z%^g^e4pYU7QU+70>X6@N8!MLvy90T(-^S>!H9)KlzK}^9?+2AmxWvUsf
za#|dt{jYdvvtE`A%o@#2Ekwzw#-=>ylw2Pv=8O&~1gRJIyS;rc;5^v(z-??KG4sNX
z*9m|)RRr_KdMxdJjP;7Q@o&J3kS~)vO^3Ts6IPFhamH<^OF;`eNVEMO6MEbeP6u2{
zcKcS-;Hba+tXv__C)J@W7P0r7bUpwX2!9CK1sF(ilvG`<u9<pGb2Zag)blr{#6M#(
z@VpEw<)-*KsI^h(!w2i=rlb<!wlcB@!Y_3Af~)$i0Rq+Ye=0aOQU3ua>0Ln{rO8Mu
zQFBz~6(U{n*5h73n<)vk7Nz=1dwiAgy<Qc{{SUN2F$3>257J}2mqapL92>%DKfQ%^
zgXb01^^M2(H~qVt_wNp6I06+7dQ5_~a!nZ-egI>ot<L3Fr-U^=uc?<(k^-7`ekdd<
zAk=|EJ0h93r-RLDSBVtQu{y{`!n>vSD<#wmpRvdT{q3_9&F2?4-}c`5L`_$fuOlfn
z`SmEPZA=5r8*l<Z5H*@##NrYZ$9icN64EI&7vkZON<dd&ehFwbUz!4RYU+fyLrkY|
zq*{Xvv6MLeMIG@TQ?v$ZIt$5L@4ovDvGkS|eL9LAuLpK)U(?W@{0B}r4y~~IpwsX1
zH=uvo%bcO31D3dA02tyr6*_O6nmmClx<5<~rH1|yD*4Yca-?C*IMiNhGGb^DF_uE|
zbI{j9-!rz11LMFvut1m1mt@bPIz$h<Tv3>XQCOK>*c9STq3t=;d|~5ClVtAx?=^DZ
zXe9qmR-v%|Gsu(*2V#|pu?jiZ<YP!M51d~+9}d1Z$xWz%gq{4aO2TUl98e7TVpkfx
z7i=d(m!#&X$}7yn??F`hKV#Fqur1S1zVEe@I13=eLv~SG@7Vs-RyIOH7Rd>!bJG?k
z?m$>F7ZG-uiwL*98^ke-Qc=S|DHAHcyDjYUwE6Y>oI}8aTq~R8CG(tIU-6n%z61<}
z9d<bjs4&uu3oG3XAfB0N7G%On%S26BJn6?&*lEAh37?6|{by|^6KW3E1jyA#0k3p$
z--lk_#NsXFP*FP+8k^SA`Y6FhC^lh1>On!OI)p)2vmp@H4O`RY4?^Nsu3Og{T7G@X
zF-+2d+`kfH1oCOfMHS>esGkmx6=0^q<DZ~W=12#|4mmI}PXe7a4p9sB&*7_)%)s_N
z^2tYA`hf*HZ59?aE@B1+{nR`(G*XZwtAL#8z$qMRfn|L3WVz4_d(Q?daA6esaWr!a
zr*IE-zFe3`mBM`q^q(vPSF{w+ci`%jTniJl+YR6vMU<ip5^*nxqEekw(04EJ;LNO@
zC467aRFxTOK7?r)v(@TT+L|gd9y}vZSG<Q3;1Oe~W`k^Sn2=4bR-|U8b9hbjlFsn<
zHzeVqEsW^o_6Mk$UVe6Xe29Mot|tH#$<GWRQbv$&<a5<QCs55B!<A{jjrYt>KZ^Fj
zHc%_1dJ7|Bv8XUeCGnogL|tZqn78jhbWiyem?_LSfZ^}qA_v=c(Ce|7HY=rV{168)
ztcf{k_T^==wJ_K#qh*KCLYX&8GZJ$Hfbq=JX4BXXvi9!q@=&_>v<D2*Yfz9mFciI^
zFKP{=3Pz+GRs3l+9SrBqDZ`mX=~zFZK!#()7$leA6d+4FZ9W)qmHE6fyZpNn_bPas
zjCt8^zq=hn9*$C$n5Y@5GDBA}CmrhP<SNui+#%fR6ls~qe)B|fL}-!~zlzvgFR_uy
zzRYUYuy-o8S!~PW`s%oUfJwt-@mo`pn4UWkf-xGH@X8SEK?U8^9)w@2eX8?onSNvx
z;Hvh_mw0KzP^jl$C@5Ex_$lMVd>pJ~2d+eEI~coTskvVVc5iue?Z^L1R<kzbHzn*7
z)Ssrs--i#siG_?xZu@DrnnVc~_0@+D9&Y-;?$+Ao-H&IcIt>V`csxH#e08udfLMxm
zHBzlZC^@C~v(_{<`1gq4hc(Ufco|2l_I*+H{cb}05NCZ+^Zh6NAR3G~zE6|3?{hqc
zFz|YK25KCo#Zg=`0~St9<t0=)3;u2Fe-jII7{a8GAMp3EjfTYUVeu0z9$+!jC|Se%
z0mobn-xPCgwDn7s3m2E>8?{Dlap}T$y?HsKxyT>kY>B8P@4|!api7CuZMjWh!yOj<
zqdY>nXWRy)mRT63<!u*zn!E#-ei2#E+Lv(OFLC-2I^Puk3^5HC98e7+_9gwl;#L%A

literal 0
HcmV?d00001

diff --git a/src/__pycache__/utils.cpython-313.pyc b/src/__pycache__/utils.cpython-313.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..3ac51186b10210154a933cd9033de60d92dab316
GIT binary patch
literal 5478
zcmb7IZA@F&89w*R-!=x@K)&DxNQ;~13rNyrO&g#<AS9u_xcR`5XUxTM>aU%9od$2}
zP=8FcS{E8MimO$crFD~|O&VJ(EkE|7sV1#I?Km3jmTJ+KKauvsS(0|@{_H)+zQ!O_
zbw~KT=i@zJ?|JU?zK6$ly9Gh|*>4svU9=<gPg2p7xmtKU%^-9GNeCl}k=T<AW~gK_
z3z9p@jq#WlNgsbw7&BnQm=PPtOxQ%**pp^#rur6a1u2}gjoGms`gTZ$fI~6{SYMmI
z<eKc`CDT@PnZL|nr(_QBpl1m10w_R_h4kP?$x7Rspv6X8Tv8itvj>a;cfj4p5`7qH
z3Rr#5t<9~M=xhebQC+85YL^-|*OZ*FQe(gkb2asuq^9bK7D<#`&;x5p9(ooYdYh}g
ztx^l!-xk<kE8X8#X{WRWbhpB9Tfot0khWKKw?$ZQN5*UMtI=3gofBu%iLe??CKPct
ziN%?a8WKb4NL)^+A<}GlNX~HD%V_*WNWJ9cG=4m)sG2aDPQ_%+bS6c#LNQPfM&qG~
zteIoUNH8W}kz<+x%W4`Y!f>m#WP}n2zsLWA>;{^ub@<p?u~z6nQ^a&Mt!es^kIb?m
z9jw+5R_BqJwGlqk24$#rAc;L#-C3O`Md^C&4y4b$kCnJ1oLIkW+j?D6gIzoHR(*vo
z<mEHlB(O(H1Or8)iHI0ZCT63NG^U2m^zG^nDR32W*{g_q#9iHqP_0PKSyzwCiUPLw
zDj5&Cv0(j;?S<*#nuO{Vz^%qZs%E+rO3cJ$taweDvAO}xIvrA?;X%3$%@~p4%2lih
z=~PO_nsqoDlTTDeX?97)awx7>&7eCDrvNomFi18Q40;(%tgH}|irTZ`qXEAH>je^#
z^qd@cMOI!{lc~U&L0>?@;XoSTr|eD5X?BI!Bv{=NZh_Inq{>;y=FtP*y3DuS<y%%A
zp7$f!xnKPFgCCdL_m><8RvLyL*j&rD_Pe(Bf_S)OdtsGSciy$_EZI8C0@q~ux6vpV
zo;VS-Tesh}ZvXIH$@)xzf95evjWqL26w6^XiRaeglbnI#(?q#wAF$1<OoG{m5-i}Z
z9?4`DNIEvUD^(P_h>)Lgp%ZX|1m|acWVQ_nW~$+OtxID4oCEdNP^n`_ME~zB-}ZfM
zzQU>V2w4#zTjyd}Q(qsj%Vj!7WK|5sVq%nh<>D-W11JM0<6_N@ULnKpy_||<1jywG
zR8k3&PsdZxq(*0FHRd_5pc&+=Kp_f|s+^e7_(&`{jT^xbnn6ioRi5$kcnhgEO8$w7
zGrq~8SAxT5e5d*+CCy6L57PBD4rWkz&=euzW-_D!pc$;w!JW|B3O_}KY##lib)dj|
z?l-yTPp%l9%f^<Xv1Qq~rD)vpg{x~}aK+ZLY-=mp+5l^Be(>fJv(&ld$wy1=FWj>o
z*`)K2-rsva-o3P=u=nLs`|-cp`X33%z3Yhq*_sx2m#l3Cz73PrHA`hrDIn2xcr!pJ
z#oMo;a09i~bIYcT=tug!uqeU!naz--W0Lws@S!><iYUVFM9(7~t22P-Syn{taPy?^
z7}t(wnVo2g?20BM3c>D(MueM1m40Bdov(#rQJ@}KjLuRlh*3ohiC0K#1tF&=hv60p
zPiuTKB_}k)6&Xio=QQ)s)v!#xhL^=%q@Rn%BMLdIeuoY^56oV<NK8CxC;XH_$mUU*
z7X;6$z3JM8cP?Zt_w1cHWyRKTZS3u_pN@acAxGE!2G`dDNa%v%e^;&U$A}R;e`|1;
zIgsBdWWu+a`#F?t?BQ;ipzsGvKQjJ_gVG&DbI#K5<nA;ukZV>ogbA#aXhsg#UrNoH
zy$FW<E|<6F&epC`zfK?+mOvv?@3?9g0Xwdy4)`?d92Oz04N1Rln32)1Is^u+8?~vM
zJGZk=V-v?Fu}3(v%Ps^Esku0S$TmWCQ{)S#N#gv-fh3;N8Lyv@fJkBzVBH8nlE_)6
z1}P!q8Bd00MDRBvmWiROFoM9s9!;n+P9<X%N9i8I7($g8s1q+*;iGTZqoUWWap5aH
znjsnoXEmd73V1V9_=-B1j3u#VA3QUD#upqI@%8vd21sy1meDMurzeMe!G7ORKPJY~
zgcODa0lWm9csFgLi)f6zfov>f6IGBN0mbLxr_4h}K<X6S51g)>mg|-ed$XCJzg%+e
zUJzES&bN=PxLSZA8r?T-*KJw<M}x~<2a8<?OU^?J!dJi?EvxR9n`76<vgtp&{?c}*
zt>~Uu7`or!Ua<X#LYWoZt0sHF*_FGH8((6V4lH#R9Ea|i4zB{(%K~(NqwIi9yw%Zv
z2>q(x3HhBvmVs^DXQ*+Ynft6+fHFP|8k#kkR#Ry;NN7nj{vZwCuR0gzpi56Rh#&fn
z5ck)^jMt}GlQnR1z+Icb+gI~IYhxgqhxfn{c3tGPDTJrsZBa>nMhBjstAlk7wz?j8
zYjz)duzF@-LBfAdy|)T(e#)h{0Js?nZXP`8dT<K~zMqd6Br5B`ZOk-Dp(|BHi)xZG
z=A@U^jHwWYNL$fN)FlR!uV-8pbSt4NYv9IvVe!+$UJKp_1>6Ifj%Gk|4<K4IRA$nI
z`0L=0HDfgX29Cm4bAaf&M^BygjZO{)$0mkGg0K4f$44j6Q?TPh(C-x}81PXt`S-{G
zbH!OrM=*W?>Iw-~z{BeNY=PbB+&lzb$BE8QAS1B137!Xl-|_3?InQso<?bWJ?jt4l
z(FJqafXwb?)7GMC>#|8Kn#8>OHeVp6WAHVYZP%>tSl=JaT1)P(T=bL9<({!(&)DZ9
zg#(lKO#YPymkxdp1%GGmWbW8{@VhDaf!>M3eXD<ee=oYzYZ++e?i_0zaB-ix1So6v
zB#uJ(9g0;zFGLeF@>K{t(zCPCtLvaoPEBC(_%dWS5Cm-?H>Lz9F@6>R0j^kL8vqhC
zP^|Y7)ggopi6+dm$!7sz;`Ue(qQO?@AP^WhR}$rr=$gLGszJV7b+8%})VTdUGvrC8
zsB#=1hjs7?$bh<rNqIzXz~fNbKwVqHbP4_GAkWZ{iY$gtf%XI$L1vjp_pPnV)*VIb
zj`>$s8k~#Gi>54--Ie3A+Y0tw^TR8oyS->_&rRlr^M~@?OUIUbM~b~8g`N|Ij?toZ
zw7`#6Vjwd)4>kL`5Qx}{+WAE&P&)(FY)pDcv)MCIVyc#7GcFRQl4Zn-4@rop2BHW#
z5qxc6CU^-Mm5L*W_sVHlr1D;=#Ewql<mn#C;9z_jlN*1HXl;dzn8JPSrMF)yS+^})
zJB!xN+z*S^-U8oSIi4|`#^iI>1U0FK;Q5=v@<vP%dZK47LjnHP0e*0*cG{^b2_bZD
z{~kbJU9?amGjdX$*mRlT*G9r40)5+9iK`K?03Mnrx{`3NZx7HZDer-OB@9!9_Gyv~
z6x~L@0Wfaz3y_<scehX)wDwvhn`9@{e2zJK4xte2Z*8=GYe1`xh{M~EX__F;RZQVz
z1pKcePKWSA!e^1nYUhtXB-YTFV;ZwZW9%93s5q5jFNzs%m)NZ_`!vR@A&3b$csQK)
z@(?=`d*fsp-VwqqxMQ_KX+|u;Jb031elnv4R)T*^BqHGG>~P01Kzy}og6D3S(l7@~
z3OPC@JDu(vG$07-d&Xq17vQJ73mJf-(KSB?F8f0vd%4)w^NIiV!H)yQw*FG<K*>Eg
ze`>YCz39)LeJ}V?I`9AGkBXk&rB_Q0hv!eMSnP}TqGd;p%Vmns_7}y0qGe!yaFsVN
z3@lt(xU?9~c4j@<>0E2hlJCq%^5>UAw}quQZifn%<DX97<wsYHj*_tj`0!n0nM0;l
zibJptKYDujjF*9b+dK@y9*MnxJwTWys)qM&*Nnm7Ofnn{YHU)$#4Qqcq+W_er!m2y
zW>Du+;DazBD@?c$6K_pjkR~M3ad^D5iIm1ojE>Vdzv62QmH!LShdh0IY5a6D8KW^g
z{yt2g851)hj6-vnL`-;yWQ1|>G|9*ZM-6-n(Zf_eOw)_;<V-pyzl7g_eu5Ci2029Y
z4D*O(8UC>WF_tfo<4e@~chp@(-CrQ6Hhqaak9Z67Y*s2G5c$aO61NghNwM5&X4<oA
z8G*?2`N><BC!|<zHZmU43?k1zA>vU}6XVYIl@W-%yfk>*wRGZEl2$)&E%+vveSsqU
zjb408G#+(37|-JL&CBmyE+Z)BVJ;B2!&H3U_mtEgi99pL<R{CB$lIM2`KeNog|kyn
mX-C<{GJQF|j6mc)Pl$MAGBM8VU>SkPb5txzUy&NM*8czvf|n}*

literal 0
HcmV?d00001

diff --git a/src/__pycache__/utils.cpython-39.pyc b/src/__pycache__/utils.cpython-39.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..b62b19a15b19d1660e5af26da604618214e16804
GIT binary patch
literal 3426
zcmZWsTXPi074Gi2>_yr|hy@Fa*aMi$5Sw5^B`$&;gOG?4At{nD#YEK9XuEeAF}t(w
z=~dXRmCIG4@<x((pbF(Jm47s^dEzgqDye+kvjPQ=YWs4!`*ipD&iPI&s@19l-(Uar
z_a~2Qg#24~j(#pW-{O}MN(d(b;gqw42GrCnV5qIc>ezuz^_ZPF9XD`0rJ&R)2W2B;
zNhPS5`PE<owUbPCYC#QS=R{qw?PI+3it#e9Ja>XAVGCE-rwOk@Ho+&K+re?jrg;th
zIzNW~34R`ul4yuVi=8H-EGD*3V#U-eiy!CH&~l1@re&Dbz{<ueo1f&TApeM8FtWO^
z`3$6|`NxpXKz5qXLjM{5GwA=AU(~uqoqr0A9zTmYvz)CH|I*N}K2UKItAW?*cbh6s
zyP4NYrN<)`c~QUJ5nUB&arLb><FZe4do@x|d@Hw?;!NevM!%Pcyu8xWv!VnOoW)Mm
z7P-B+ys+Z4ypp8tFcCW<$z3T_Uv`_Y{ku=MH7axXW!F(CvP~6JWJKOr`(zJ@DDuYU
zY+u*TK4~*<y|5_ey>V4(pW+_&aCRM<dmgrG$KAHqOuMbP-IwO*!y6YaM;R{H5q{=<
z;a#}gjovlQ!H)DhBFk`kKO3IZHVBW};40MP;?DRouu~^edHG4y<%y7)U(QS80|XOW
zQ5HAn%rWv(Tfm4)=1#xY6Ec`sh!gR<VpULES5ics!)^t0mv9Rq^KuyKgN30_Wf_L~
zCy~cd9b9VO+<cH>!_98HKM<RDMfOysz0H-mwarX6H~T;|yV@J%wM-i&9G_`Y8+Zx@
zVK$wljFqYTU-lojEKfkDf#R_gO_j=ltU&UADA^F`GZ>V<L!*u8_y^skZL-UN6xk<o
zc|`A$$2WGZ5qm=+W1Nkwm*h2&+ozNqm1<<)k9<F)>=E13NLs^l_k{AIB=KVHMP3W0
zf=kM@<Gnkc?+op$+r9SCK`Gkk^t!s->hvH|ajTWnE54Jv;u%~t)3p*^p4;st-IB*}
z`rOS@sRZ|J*+4fqzW!i!b!Ba1{%*LivUdOW#(F+s_7Bbefdvi5_(d_TRU89S;gLx*
z5N350gq308GX74{GgQt(0_#?bsXYYGPtD6P=bd@i&>4OO_l6Po>EC8{>4?5z`(Uhx
zFuF}_vIqC?PJKzTE7u^^e~*e$1hq|+HCQ^7a%-Jj!zvRbXTOV*7+x*BxMd9M#hDj*
zJ6c+pdwF94Ceh)T+i6d919wNrxHZTt^Us>Xgt*V-8H@*3+-ZMklDbia4GO!Q$Gl9t
z9bpU}cagd%<)`TTmQj*Vs7PuvX7NxIR?(I?{It_)IyX-D7c_<o+A0bTw+EMk<AEId
zM1G>}vaSgMt_S+C_Zh~hyo0tgLJPIa*$Ydrcu0(mN`oIM*@Yd4=Tw<nBe)~Cjl0@=
zaMp*gD5tyD50=(kw5}am(ixsyN+a$ef;}np*~ixNX;6#1O2}TC6x7q0mlAZEV7lg|
z!lw_|P0z37R&(ci;Km(<KhLcU{7`Q0sJS#rWl)=2Sz1{O@7!CvzIN|U0OHi!1l7gm
zjrq0k_S*by`3Ve?J3WaFftkicdPZb6$*K4dovJ=Xfz0Qan4LlaWLO=Z>RNTnrqj%&
zb=sivGDhBpD4_Wws(d2tt6pD)+I{oV_kFmG8q<V@@x#wS;~ionbcVMIKL!E}s8}Pq
zZEf2~nn=4Zm?3dTxg)wqM;7LkMy$>Dfl7fWe7QW>0ZvH9z^MY9sKLnwdA!HT*|mSL
zxeJ_3%i!d|<4eQo^=M}dj;B)N^Bai8QZJH7Y*}753=yVJhbIc4vS{Z$PVy{nu)N?`
z<vBFuXDAMV0Vvl2PVN?(a;NhY^c0lh&Yxur2hgq`G#2kaTwC0j4}ZTpe=q#wgWF4s
z8;=Zb@&d+v$Jkb0(aL|W7gP$4*lJ68NeeaIA7Pv-PB#v%Z!t0^a{y>fSu+SO1Kl-@
z<QCGFZ|AjC#>j_JQsCyqT`r!1`}(a`{H%z#qv+{)(+HY)(|Sf^8!^J^h{5V$A<kaf
zuWe2E+raB3C>=i_3pA`*#1-iK{2bgF45N8dXD{=b7$;FNW|^FZfpzUV*N=!yiH^LA
zz2prPa5wz~kiR?>$Y1H!2X;8!G<zK8X2A_h>)lo{JJa+<;K|ce{u(Wv+4O0Q4Sq_!
z`u(9v$6Q*|cahDu;iBeBY<NOvB(1?KLcQzVzY`NOr8VRHcmkBNg2Irfzk-Gj&pV|l
z&KyB22s>Lkfo6v3nEVaed3jZ)ZNzv6la!i$sl79IRH`C8ntD<IuI5psN?4?c)g1ac
z8k(ULQ9xxx8Uzf9h?)gU?$KRa0k@-4ZtbyM2W)3I5HVO`&tT0*WY<*|cMaC1kqgAj
zBL`*0aAVa(-o$G>VR=nQ?ud-&Qzm~@)*f;XuLJ#K!|7E`M_zAy8*eL;Z#AH8{O~>c
z_N_Me0sZ=besMr+L+hsZry+an4Xq2_<pcVQ1M24lPe=>tdKnIEL0j&~w2$oVw7_4g
zh@6uA8hYe6y7(=Mpo*RF$n3V&lb{AuCvb{!w~QxOQ%8GXVbX`#)D3}#hbIo8Y@Ebx
zI)en>pr3;t<r3sTSKHmEcm+$p5PVrww{&$TFNGmbn_-x<G?V!EgJ`BvPm*{`YP54#
z4SJv#siBlQ+N2IQ!!Ci-?RR>EfOUI;wYs=ul5jyIZt)&8&ouLz$nC8(O-v${i%<}h
zx*Ru)28Oq#j$GsU@(;SD9n75n$kk0inO98tRww2CM0}%x$#hP!E&X(v#LZ338k3EQ
Osmi&=%+x7&%Kje`FF>yV

literal 0
HcmV?d00001

diff --git a/src/config.py b/src/config.py
new file mode 100644
index 0000000..2231176
--- /dev/null
+++ b/src/config.py
@@ -0,0 +1,40 @@
+"""
+Configuration file for data augmentation
+"""
+import os
+from pathlib import Path
+
+# Paths (BASE_DIR is the parent of the directory that contains this file)
+BASE_DIR = Path(__file__).parent.parent
+DATA_DIR = BASE_DIR / "data"
+INPUT_IMAGES_DIR = DATA_DIR / "dataset" / "training_data" / "images"
+OUTPUT_DIR = DATA_DIR / "augmented_data"
+
+# Data augmentation parameters
+AUGMENTATION_CONFIG = {
+    "rotation_range": 15,  # degrees
+    "width_shift_range": 0.1,  # fraction of total width
+    "height_shift_range": 0.1,  # fraction of total height
+    "brightness_range": [0.8, 1.2],  # brightness factor
+    "zoom_range": [0.9, 1.1],  # zoom factor
+    "horizontal_flip": True,
+    "vertical_flip": False,
+    "fill_mode": "nearest",
+    "cval": 0,
+    "rescale": 1./255,  # presumably maps 0-255 pixel values to [0, 1] -- confirm
+}
+
+# Processing parameters
+PROCESSING_CONFIG = {
+    "target_size": (224, 224),  # (width, height)
+    "batch_size": 32,
+    "num_augmentations": 3,  # number of augmented versions per image
+    "save_format": "jpg",
+    "quality": 95,
+}
+
+# Supported image formats (lower-case file suffixes, leading dot included)
+SUPPORTED_FORMATS = ['.jpg', '.jpeg', '.png', '.bmp', '.tiff']
+
+# NOTE: import-time side effect -- importing this module creates OUTPUT_DIR on disk
+OUTPUT_DIR.mkdir(parents=True, exist_ok=True) 
\ No newline at end of file
diff --git a/src/config_manager.py b/src/config_manager.py
new file mode 100644
index 0000000..62d612f
--- /dev/null
+++ b/src/config_manager.py
@@ -0,0 +1,175 @@
+"""
+Configuration manager for data augmentation
+"""
+import yaml
+import os
+from pathlib import Path
+from typing import Dict, Any, Optional, Union
+
+class ConfigManager:
+    """Loads a YAML configuration file and exposes its sections"""
+
+    def __init__(self, config_path: Optional[Union[str, Path]] = None):
+        """
+        Initialize ConfigManager and load the configuration immediately
+
+        Args:
+            config_path: Path to main config file; a falsy value selects
+                the relative path "config/config.yaml"
+        """
+        self.config_path = Path(config_path) if config_path else Path("config/config.yaml")
+        self.config: Dict[str, Any] = {}
+
+        self._load_config()
+
+    def _load_config(self):
+        """Load main configuration file, using the defaults if that fails"""
+        try:
+            if self.config_path.exists():
+                with open(self.config_path, 'r', encoding='utf-8') as f:
+                    loaded = yaml.safe_load(f)
+                # safe_load yields None for an empty file and may yield a list
+                # or scalar; every getter below needs a mapping.
+                if not isinstance(loaded, dict):
+                    raise ValueError(f"expected a mapping, got {type(loaded).__name__}")
+                self.config = loaded
+                print(f"✅ Loaded configuration from {self.config_path}")
+            else:
+                print(f"⚠️  Config file not found: {self.config_path}")
+                self.config = self._get_default_config()
+        except Exception as e:
+            # Best effort by design: report the problem and continue with defaults.
+            print(f"❌ Error loading config: {e}")
+            self.config = self._get_default_config()
+
+    def _get_default_config(self) -> Dict[str, Any]:
+        """Get default configuration (a fresh dictionary on every call)"""
+        return {
+            "paths": {
+                "input_dir": "data/dataset/training_data/images",
+                "output_dir": "data/augmented_data",
+                "log_file": "logs/data_augmentation.log"
+            },
+            "augmentation": {
+                "rotation": {"enabled": True, "angles": [30, 60, 120, 150, 180, 210, 240, 300, 330], "probability": 1.0}
+            },
+            "processing": {
+                "target_size": [224, 224],
+                "batch_size": 32,
+                "num_augmentations": 3,
+                "save_format": "jpg",
+                "quality": 95
+            },
+            "supported_formats": [".jpg", ".jpeg", ".png", ".bmp", ".tiff"],
+            "logging": {
+                "level": "INFO",
+                "format": "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
+            },
+            "performance": {
+                "num_workers": 4,
+                "prefetch_factor": 2,
+                "pin_memory": True,
+                "use_gpu": False
+            }
+        }
+
+    def get_config(self) -> Dict[str, Any]:
+        """Get current configuration (the live dictionary, not a copy)"""
+        return self.config
+
+    def get_augmentation_config(self) -> Dict[str, Any]:
+        """Get augmentation configuration (empty dict if missing or null)"""
+        return self.config.get("augmentation") or {}
+
+    def get_processing_config(self) -> Dict[str, Any]:
+        """Get processing configuration (empty dict if missing or null)"""
+        return self.config.get("processing") or {}
+
+    def get_paths_config(self) -> Dict[str, Any]:
+        """Get paths configuration (empty dict if missing or null)"""
+        return self.config.get("paths") or {}
+
+    def get_logging_config(self) -> Dict[str, Any]:
+        """Get logging configuration (empty dict if missing or null)"""
+        return self.config.get("logging") or {}
+
+    def get_performance_config(self) -> Dict[str, Any]:
+        """Get performance configuration (empty dict if missing or null)"""
+        return self.config.get("performance") or {}
+
+    def update_config(self, updates: Dict[str, Any]) -> bool:
+        """
+        Update configuration with new values (nested dictionaries are merged)
+
+        Args:
+            updates: Dictionary with updates to apply
+
+        Returns:
+            True if updated successfully, False if the merge raised
+        """
+        try:
+            self.config = self._merge_configs(self.config, updates)
+            return True
+        except Exception as e:
+            print(f"❌ Error updating config: {e}")
+            return False
+
+    def _merge_configs(self, base_config: Dict[str, Any], updates: Dict[str, Any]) -> Dict[str, Any]:
+        """Return a copy of base_config with updates merged in recursively"""
+        merged = base_config.copy()
+        for key, value in updates.items():
+            if isinstance(merged.get(key), dict) and isinstance(value, dict):
+                merged[key] = self._merge_configs(merged[key], value)
+            else:
+                merged[key] = value
+        return merged
+
+    def save_config(self, output_path: Optional[Union[str, Path]] = None) -> bool:
+        """
+        Save current configuration to file
+
+        Args:
+            output_path: Path to save config file; a falsy value selects
+                self.config_path
+
+        Returns:
+            True if saved successfully
+        """
+        try:
+            output_path = Path(output_path) if output_path else self.config_path
+            output_path.parent.mkdir(parents=True, exist_ok=True)
+
+            with open(output_path, 'w', encoding='utf-8') as f:
+                yaml.dump(self.config, f, default_flow_style=False, indent=2, allow_unicode=True)
+
+            print(f"✅ Configuration saved to {output_path}")
+            return True
+        except Exception as e:
+            print(f"❌ Error saving config: {e}")
+            return False
+
+    def print_config_summary(self):
+        """Print configuration summary"""
+        print("\n" + "="*50)
+        print("CONFIGURATION SUMMARY")
+        print("="*50)
+
+        # Paths
+        paths = self.get_paths_config()
+        print(f"Input directory: {paths.get('input_dir', 'Not set')}")
+        print(f"Output directory: {paths.get('output_dir', 'Not set')}")
+
+        # Processing
+        processing = self.get_processing_config()
+        print(f"Target size: {processing.get('target_size', 'Not set')}")
+        print(f"Number of augmentations: {processing.get('num_augmentations', 'Not set')}")
+
+        # Augmentation: keep every entry whose settings dict has a truthy "enabled"
+        augmentation = self.get_augmentation_config()
+        enabled_augmentations = [
+            name for name, config in augmentation.items()
+            if isinstance(config, dict) and config.get('enabled', False)
+        ]
+        print(f"Enabled augmentations: {', '.join(enabled_augmentations) if enabled_augmentations else 'None'}")
+
+        print("="*50)
\ No newline at end of file
diff --git a/src/data_augmentation.py b/src/data_augmentation.py
new file mode 100644
index 0000000..430ee79
--- /dev/null
+++ b/src/data_augmentation.py
@@ -0,0 +1,161 @@
+"""
+Data augmentation class for image augmentation - ONLY ROTATION
+"""
+import cv2
+import numpy as np
+from pathlib import Path
+from typing import List, Tuple, Optional, Dict, Any
+import random
+import math
+from image_processor import ImageProcessor
+from utils import load_image, save_image, create_augmented_filename, print_progress
+
+class DataAugmentation:
+    """Class for image data augmentation - ONLY ROTATION"""
+
+    def __init__(self, config: Optional[Dict[str, Any]] = None):
+        """
+        Initialize DataAugmentation
+
+        Args:
+            config: Configuration dictionary for augmentation parameters;
+                only its "rotation" entry is read by this class
+        """
+        self.config = config or {}
+        self.image_processor = ImageProcessor()
+
+    def rotate_image(self, image: np.ndarray, angle: float) -> np.ndarray:
+        """
+        Rotate image about its center, keeping the original width and height
+
+        Args:
+            image: Input image
+            angle: Rotation angle in degrees
+
+        Returns:
+            Rotated image; uncovered border areas replicate the edge pixels
+        """
+        height, width = image.shape[:2]
+        center = (width // 2, height // 2)
+
+        # Scale factor 1.0: rotation only, no zoom
+        rotation_matrix = cv2.getRotationMatrix2D(center, angle, 1.0)
+
+        return cv2.warpAffine(image, rotation_matrix, (width, height),
+                              borderMode=cv2.BORDER_REPLICATE)
+
+    def augment_single_image(self, image: np.ndarray, num_augmentations: Optional[int] = None) -> List[np.ndarray]:
+        """
+        Apply rotation augmentation to a single image
+
+        Args:
+            image: Input image
+            num_augmentations: Number of augmented versions to create
+                (None selects the default of 3; 0 yields an empty list)
+
+        Returns:
+            List of augmented images; plain copies of the input when
+            rotation is disabled or no angles are configured
+        """
+        # Test for None explicitly so that an explicit 0 is honoured
+        if num_augmentations is None:
+            num_augmentations = 3
+
+        # Get rotation configuration (a null "rotation" entry counts as empty)
+        rotation_config = self.config.get("rotation") or {}
+        angles = rotation_config.get("angles", [30, 60, 120, 150, 180, 210, 240, 300, 330])
+        # random.choice raises IndexError on an empty sequence, so an empty
+        # or null "angles" value is treated like disabled rotation
+        rotate = bool(rotation_config.get("enabled", False)) and bool(angles)
+
+        augmented_images = []
+        for _ in range(num_augmentations):
+            if rotate:
+                # Random angle from the configured list
+                augmented = self.rotate_image(image, random.choice(angles))
+            else:
+                augmented = image.copy()
+            augmented_images.append(augmented)
+
+        return augmented_images
+
+    def augment_image_file(self, image_path: Path, output_dir: Path, num_augmentations: Optional[int] = None) -> List[Path]:
+        """
+        Augment a single image file and save results
+
+        Args:
+            image_path: Path to input image
+            output_dir: Output directory for augmented images
+            num_augmentations: Number of augmented versions to create
+
+        Returns:
+            List of paths to saved augmented images (empty if loading failed)
+        """
+        # Load image
+        image = load_image(image_path, self.image_processor.target_size)
+        if image is None:
+            return []
+
+        saved_paths = []
+        augmented_images = self.augment_single_image(image, num_augmentations)
+        for index, aug_image in enumerate(augmented_images, start=1):
+            # Only the file name of the generated path is used; the file
+            # itself is placed in output_dir
+            output_path = output_dir / create_augmented_filename(image_path, index).name
+
+            # A truthy return from save_image is taken to mean success
+            if save_image(aug_image, output_path):
+                saved_paths.append(output_path)
+
+        return saved_paths
+
+    def batch_augment(self, input_dir: Path, output_dir: Path, num_augmentations: Optional[int] = None) -> Dict[str, List[Path]]:
+        """
+        Augment all images in a directory
+
+        Args:
+            input_dir: Input directory containing images
+            output_dir: Output directory for augmented images
+            num_augmentations: Number of augmented versions per image
+
+        Returns:
+            Dictionary mapping each original image path (as str) to its saved
+            augmented versions; images with nothing saved are left out
+        """
+        from utils import get_image_files
+
+        image_files = get_image_files(input_dir)
+        results = {}
+
+        print(f"Found {len(image_files)} images to augment")
+
+        for position, image_path in enumerate(image_files, start=1):
+            print_progress(position, len(image_files), "Augmenting images")
+
+            augmented_paths = self.augment_image_file(image_path, output_dir, num_augmentations)
+            if augmented_paths:
+                results[str(image_path)] = augmented_paths
+
+        print(f"\nAugmented {len(results)} images successfully")
+        return results
+
+    def get_augmentation_summary(self, results: Dict[str, List[Path]]) -> Dict[str, Any]:
+        """
+        Get summary of augmentation results
+
+        Args:
+            results: Results from batch_augment
+
+        Returns:
+            Summary dictionary with image counts and the augmented/original
+            ratio (0 when results is empty)
+        """
+        total_original = len(results)
+        total_augmented = sum(len(paths) for paths in results.values())
+
+        return {
+            "total_original_images": total_original,
+            "total_augmented_images": total_augmented,
+            "augmentation_ratio": total_augmented / total_original if total_original > 0 else 0,
+            "successful_augmentations": len([paths for paths in results.values() if paths])
+        }
\ No newline at end of file
diff --git a/src/image_processor.py b/src/image_processor.py
new file mode 100644
index 0000000..46c3111
--- /dev/null
+++ b/src/image_processor.py
@@ -0,0 +1,174 @@
+"""
+Image processing class for basic image operations
+"""
+import cv2
+import numpy as np
+from pathlib import Path
+from typing import Tuple, Optional, List
+from utils import load_image, save_image, validate_image, get_image_files
+
+class ImageProcessor:
+    """Class for basic image processing operations"""
+
+    def __init__(self, target_size: Optional[Tuple[int, int]] = None):
+        """
+        Initialize ImageProcessor
+
+        Args:
+            target_size: Target size for image resizing (width, height)
+        """
+        self.target_size = target_size or (224, 224)  # Default size
+
+    def load_and_preprocess(self, image_path: Path) -> Optional[np.ndarray]:
+        """
+        Load and preprocess image
+
+        Args:
+            image_path: Path to image file
+
+        Returns:
+            Image as a float32 array divided by 255, or None if failed
+        """
+        if not validate_image(image_path):
+            print(f"Invalid image file: {image_path}")
+            return None
+
+        image = load_image(image_path, self.target_size)
+        if image is None:
+            return None
+
+        return self.normalize_image(image)
+
+    def resize_image(self, image: np.ndarray, target_size: Tuple[int, int]) -> np.ndarray:
+        """
+        Resize image to target size
+
+        Args:
+            image: Input image as numpy array
+            target_size: Target size (width, height)
+
+        Returns:
+            Resized image
+        """
+        return cv2.resize(image, target_size, interpolation=cv2.INTER_AREA)
+
+    def normalize_image(self, image: np.ndarray) -> np.ndarray:
+        """
+        Normalize image pixel values to [0, 1]
+
+        Args:
+            image: Input image
+
+        Returns:
+            Normalized image
+        """
+        return image.astype(np.float32) / 255.0
+
+    def denormalize_image(self, image: np.ndarray) -> np.ndarray:
+        """
+        Denormalize image pixel values to [0, 255]
+
+        Args:
+            image: Input image (normalized)
+
+        Returns:
+            Denormalized uint8 image
+        """
+        # Round before casting: a bare astype truncates, so a value such as
+        # 254.99998 would become 254. Clip so that out-of-range input
+        # saturates instead of wrapping around in uint8.
+        return np.clip(np.rint(image * 255.0), 0, 255).astype(np.uint8)
+
+    def get_image_info(self, image_path: Path) -> dict:
+        """
+        Get information about image
+
+        Args:
+            image_path: Path to image file
+
+        Returns:
+            Dictionary containing image information; empty if the file
+            cannot be read or an error occurs
+        """
+        try:
+            image = cv2.imread(str(image_path))
+            if image is None:
+                return {}
+
+            height, width, channels = image.shape
+            file_size = image_path.stat().st_size / (1024 * 1024)  # MB
+
+            return {
+                "path": str(image_path),
+                "width": width,
+                "height": height,
+                "channels": channels,
+                "file_size_mb": round(file_size, 2),
+                "format": image_path.suffix
+            }
+        except Exception as e:
+            print(f"Error getting image info for {image_path}: {e}")
+            return {}
+
+    def batch_process_images(self, input_dir: Path, output_dir: Path) -> List[Path]:
+        """
+        Process all images in a directory
+
+        Args:
+            input_dir: Input directory containing images
+            output_dir: Output directory for processed images
+
+        Returns:
+            List of processed image paths
+        """
+        # print_progress is not part of this module's top-level utils import
+        from utils import print_progress
+
+        image_files = get_image_files(input_dir)
+        processed_files = []
+
+        print(f"Found {len(image_files)} images to process")
+
+        for position, image_path in enumerate(image_files, start=1):
+            print_progress(position, len(image_files), "Processing images")
+
+            # Load and preprocess image
+            image = self.load_and_preprocess(image_path)
+            if image is None:
+                continue
+
+            # Convert back to 8-bit before saving; the file keeps its original name
+            output_path = output_dir / image_path.name
+            if save_image(self.denormalize_image(image), output_path):
+                processed_files.append(output_path)
+
+        print(f"\nProcessed {len(processed_files)} images successfully")
+        return processed_files
+
+    def create_thumbnail(self, image: np.ndarray, size: Tuple[int, int] = (100, 100)) -> np.ndarray:
+        """
+        Create thumbnail of image
+
+        Args:
+            image: Input image
+            size: Thumbnail size (width, height)
+
+        Returns:
+            Thumbnail image
+        """
+        return self.resize_image(image, size)
+
+    def convert_to_grayscale(self, image: np.ndarray) -> np.ndarray:
+        """
+        Convert image to grayscale
+
+        Args:
+            image: Input image (RGB)
+
+        Returns:
+            Grayscale image; input that is not 3-dimensional is returned
+            unchanged
+        """
+        if image.ndim == 3:
+            return cv2.cvtColor(image, cv2.COLOR_RGB2GRAY)
+        return image
\ No newline at end of file
diff --git a/src/model/__init__.py b/src/model/__init__.py
new file mode 100644
index 0000000..ecb9162
--- /dev/null
+++ b/src/model/__init__.py
@@ -0,0 +1,8 @@
+"""
+Model module for YOLO-based ID card detection and cropping
+"""
+
+from .yolo_detector import YOLODetector
+from .id_card_processor import IDCardProcessor
+# Names exported by a star-import of this package
+__all__ = ['YOLODetector', 'IDCardProcessor'] 
\ No newline at end of file
diff --git a/src/model/__pycache__/__init__.cpython-39.pyc b/src/model/__pycache__/__init__.cpython-39.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..231b3dd8b9512918438d45b615e8fac91c63120f
GIT binary patch
literal 352
zcmYk1&q~BF5XPIf+g(bF_y#%JgW_2h5w@2FwTt4x5*TVG)?(U}q<g4u;bVC8QM~r*
z$%_x*$;1_LAYbN#`OTjyO=Hi->*w>soBiLN`5(SDXZD!`E9jLT67(f${n95c4`k4W
zWoYvdXSH9>FuL}#`O`AKP$(pA6>g=V_e#^-;=DM#tBgRp&MB`nQWS&WL!&xcbx65Z
zecyC-{6Xxnj7*6`@}C-|t>0VcD~oNk;=&lEwcAbyRxYz>nggKX08=_DsbJUpw`kgL
z5Zp-U|6s>CsFD)k#nTJd%*od=KVdgUXv4aCI|`Ny^EjxU6{{;|G-viGAsIl^H3Ps=
UKTeC~?$A@WxrwZVVL}rB8^woVj{pDw

literal 0
HcmV?d00001

diff --git a/src/model/__pycache__/id_card_processor.cpython-39.pyc b/src/model/__pycache__/id_card_processor.cpython-39.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..23bc067fee657c3ad34ecc93b4013fd3d5b3b80b
GIT binary patch
literal 8960
zcmbtZ-ESP%b)WCqZ&DOZQI<c(j%;~VM{$+FNm$i3MbQ#lg%T(lvbTx{%e}+pkh34Y
zGb@Rcp-@0J(iU}*7H-fW3b1U000!Fr6-6KVRP>=J?px6(z4p;S?f%Z4+1cfit^;%l
z-kE#n-0$D{-E+=uR;wiiKlQ)=a_1M{Rh0jt%;Zl;<{kWpTS%DFP?*ZJKy9e<sWo&w
z^}y(u4O69WMqqX9hTSPN3Y}u3*eNwiopPfrziC0GQDG*tf@-JMsHw_zh1sm|vBC<E
zwZ;t7?kM$Qe5JH@%~@%3=G^AJmKTOS?rh_KtJ&IX^WLD#9PV{`_nU#!#CxB6{Z!8H
zwo6YjN@cyS3gdP&+Nqnuxao(HDBS8tey`gMgmKMpMM7Wh?hA8s&=0()Dr%rY<%3%{
zZ(Z{uuNC!pi<+7I(IUNr|8N%Ko`UHs4UMUo{!5<WnP(NIKf&ag`LWrs*vp>1TkwjM
zGW&_n3ap6ok}RdN(i4r9S><D+Q9e>uWi^ylj+D)?S(H_el$~O8D66q=$<i5b)|=hd
z&MK5+^XTsxwt)UlvGd*>{!YukvD7?9_6*6h#V0m9%btbo0(&Ks9e+Ld#9+^{=kfK7
z{5Jmb0{VE7IT*vD+_YE4%-S{DvV6zlYb6K2|Hn>Jb=t`4elO^`Y_u`j#IDdg;d6yH
z<~byZ+Al=PV<k~sHPVK9WE`q^H<=1#Y4HO&CONLIANkF|kG<nV%!TroW!?^#@*LGa
zGNvVmpyP~&==j|*YIa**USqv(@gj!D%SePB^xAD;RTSG^bQA9$7X{btHani{3X8sa
zysil&^nz_!<#UCfLd`FJxUzKbz0l*~y>5H3@7=rRg?mx2fA7}H#=VfY?sa<13-0;M
zZDA|iOe=c)Qh%R1@G)oCokc^Tfkd$@YP>kLZI?!3!fx~CR%;N|bz%CQX4?~1$BTA)
zOjz8D2E5y%l^^}+-Ne7#iTCl6Ksoj_K9?v%?8+h5A0-+}&Z9)lOLUaHi4rX<QFisA
z!Hh)vrNYc#>4&O{y&Sc`EbO8kf0?iA2GM{wNetV(*Ky=<bD{j@_%2GpC1<VMA4F5N
zXp__VE;(0^6HofddF?{BN*7*tE<`)r3wL?}qfD#Ujd}xqp`Le7E#{dGxr9@oTBBul
z9{ADD<dh`Wc`UEW=drw^nD-{^tgm?Xz3yJO_n?~(Jf3;o8H9kElMQnngm}))GVYjA
z-HcGh^KRbmNuSTTSzjl7<TErb`$3a;(PLfbgf#vPB@2`gg41LUZ{k!suZf19MR7=#
zlyX5WsoB3auf{J;qx4wax|a5I2DMw06hRtC+%17=fxF{>iX;Gc0Z^uW0v3z_x<l<i
zqjIJrXCQ~?M9xUmvHU&lz&x-Liy6-<i78Wynez&>WIlV_HV*8_99oH*Xo;QZiNTQH
zwGV9-Jq`=0Iv_3VX;*Oovf`mWEV9y}dQd=}0!F8PLSsaVF_pIUv&y`3P)v$<l{<=|
zMCG5U`--X@lvE{tIZ<{i!zwE$rC%z)(xlp`cNI(d07vpc=~3xU_IyKm18-2HO8k2{
zqBf4HQ3{&tV1N~9Ml)#lI8fQiYpg$|HO8VB@OZjRiF_j(cuM5*l*oY7$tp#JIq<vD
z58_u=Imb!vcSnFc2J~jI<kV|I>-L2id%PD4Gu&zRJ^l*X683h`YesK=Pw1`tms5(u
z0L7{6EAHC*+NOJVZS#h^vAVJ;%m+Ij2WK_IXut0XyX!q@KJ-ITTz%N`q%Dx*)%0jY
z_3{|4!ss-^y+(1X&0I;SjpFv`RaiTo-`<JPyw9Q?VQ^Rr!lVk9i5J5`5DC?r!a65p
ze+T~|y(osJE$TJ3rq8M8^+ny$pVKUDR-IGh-<ihw|Dmd1kMe&<AMwvqlmj_hhHafF
znQ4c*#I}*>Op|CgA!D6U4h`ViI6!V_Csc-mbQhRJsdZo^7XPcLlvpS$GviYY*aqGb
zAngEh!&*{E>^8LLP$zWn&H%xLVe?acgxCall(?PU|JMoBo*K?E>jc!=8EWNIqSgj#
z3-Oyd2EPuqIf0QmNTf?YK=nM9B~1vHPrpL)xhnKMZ~t?ZU#2y?kfSqi<3xO}*H80{
zs2~ch`_T%l6E12iumCpPtJgO!U*A~%Kvb?b2Vv+pyH|q&=Zhp<-Mq1}dgq3Fb!~ll
z;{#F7vbQ$xyeBH#ewVGJM@A^B8>^ce?&|xSs~hXfH^u3d8_R3!?(*&18@Jwf@2vgk
z_RUqHcbX4HIb-8x?lt+V)JaL|j2rlSo+xblL2$bl?2Gc2A3g9x&xO6r-+-LNKL1_3
z9YsD)hW&=UMPv4uP+^UvD}kAg1~(HldD{!4(Mceej(?vT{Q)IMX`Y`$**gBi7myJ2
zYkEz8PG8UsC_qV_)n`=;@UId4zkLk;`94e>6Qi^0hyqm5cuw>GflT~2->d)tssz6T
zIiQ~y{IkeT43rm`4v>T5(Ml0iZystOUmH0nL1H7X1Nh}(MXEp%<<+E^6rciDrUEso
z0!3y+1xiVYz@MwY%>KVY1<Dz5&kj$qLQ+0P+{J_PqcVtFKBWp2p#r7fg1EEI$}Cd&
zJ-Hq{C7?h3ITF5vr2Uimf4u&m@n>&u@*h&!6(kcRJ!)rcD2zO>C79-OQVIC)Q^mKC
z2y>;`?e6odR6yq~zedR_CGR2;#U^jv^tx>jXQkPPdHRshdF{4@F27E4Hz--7WD2I0
zF+uY`pvFv(0fziXB>RVy5Xyw@^+P}CbsJXN!8f3je1?zkA38`z=uELWdmNv~={Z}V
zZ$hVq#&dN3Ju-1Hjm};2qd~|(ou0r323f-nh5?YKCLRCqWk&hD^a>dhC?_m~=n1bD
zObtS;4%#*{(zW-01H{2Ym!?7ih6YIf7~-G<k4zv=J|*IeDbii-?vQ7b8q3Z{1GrGp
ze(IfjQRHz4u1F5HHZ3ZC?|^+@!c!)7tx;?Re*dQ5@uNm1@&oTW_t_n|V(Zdifbh#C
zOi6qurDRWbONMM_ve!#v@QLb}d~Ysa1uKFMBX8yA@{Ltt0taBgOaz}VgQNM|)WH<O
ztTDob9yGTaW-Dm!c#T5ZxyMf8H&M;Lx^iHDjdnw_&oeBkm%w(l5x+e@&2LBQey;fr
z>?i+ym{zc!$#53sh{!f_L#z&$wk=s$qaT@EIjnwzOuP*k(8)`1z-bTa(IdcV*LVzY
z!PUA9c$f*<xE6t>3oAfE2Be3R+=Q%}%YG<jr6mAa3$oJc%>Y&09|BOYWhJ0W!!pwo
z`vgGQk8o}SP<ZBmGAB;)^&an}ez;sfhh{3nI<PpsZq%fxO%5oE2EdN=c)u6OFDXdQ
zrXcBNO-;aLy<SOAYO>AHvM8;s<5YE*H&&Oi$zGSghGm<eu!<)!9eXz@YLuPobfQbx
zOd+N)MhyQk+7Wiz3zH1hD301<Uwb@?nbDxV6hQxgW^yZW4p!o<X6U8#IfBuP(=eK9
zW3z6Hl3Y!<j~JLJ^#&0fT$lM=6i1#@8&sL<vMA>D<t$R1*%-*^SH(+?vj(iE2uImt
zwGB^#X;1V6`)6uwMCuTzqjKrN-~b&c{3`sC)S*{%Y}n~hxNE{P)RLlf^tE&FW0Jzq
zI>fP<==_gmJsXyxx?9L=(otMS>t!6&f163zQxc_2!sP#)Nx+*r(ndKcCxm|ZO1qWa
zDl6iz^r;5BRUOtagVJLaZ6J?hzI;|0&ZK4JQ?Vk-DpwGaz^rUmooxB8(tQhF*(|)W
zO=w01nt@P<oIOkd%yK5FU?$KrRk=%knSM}tROyz|C+S8)7Vd2G*I3{j@mW00X+kl&
z?LbDWD7Z5ft;prSCdMIwu;frk)QNiVzfKN#jDfP`+>)Si02&z(-Osxqb2>-Sl5=+l
zQ6UgNnoUb5Oy(nXGPoV7k(Eu&hI+^`c|<-hJ)y<~RW3Q3k~dQ}q1f@L;!!@Kj`A^{
z7?R1>pC~2u?!sLDT|~x8awStWt7NN3Iu{B%9JDBQy&f;D^acUL2qFj0YqoPsPFx!W
z=sb35x8IJ>N{5DenlQIyJS#4(=I38rS)ZV}&CfMq_nRC{8H$1j2RCwidpv-`@(z-?
zluf{6PJAk*N!VR9FzV<F4bJu{p@$LAXwvWC>||s2071ye>j<OOLk!XIyW2fsP@s~N
zInV!y5)X;6(m}u#-Xof^{muhK49NfP_r1*Ns8>_I+@@M&8}J=Ud`fmHAr4KcQbvs;
zWE-_?xE|t}SlGtQI4>#g#6x)`<YuAJe?dzj*}KY|rE047KbB>{<tV`EuyhNCUO_X|
zd9^f=R^XVxC)Wz<B7E~pT6~Okvw@8Is2ie~q5%sarza|DMA+T-IaXL6-!kw@1Hq3d
zmck@ty@qsrC)zGiDoB;+2sHR-AP~?h+-jBLphPBgxHIFN0s=GBHwr}!%|nH=Oxnz(
zQ4R^~oU*O?N@Dz4{R@i1Qj0dTa~W!HN~XIADH*t${=y2NsAAJQk)nctV(DXc3MtOh
zJb^)S6*_^fh?(f58bxJK=AYl1s3v#d2$Q5AMgtBVxkp*Bl%o0h7>Oe;Ufe@i6L$d4
zGGn+npo=621%nPLo-}{QT6Lsmo;i_St~R6A4lb~Ag`DP?P2L4A;+L<<+YeG%y76l9
zUcXP7Y`Mcrmo6a+Or;)+U${MPFDpADSj_r^=y%t9X=9)VsZBH&+^@YpIVKolxUIm1
zQ;GF@f$w8bDM#F=H+id3-J;2iI89iRj6!i{RN`i1N$s4FKaZMqJ7t6eYDF@_BfJSK
zU2WW7rPJ<p;qy~yEo{KHm$M{@OobZ6!jTb-^fD{}tRY39m6@7mXccu%FF^GxQ0$8O
ztRBBQZBCus3{3LzFprtyWFpZGkJRN4(c=y@`R~*NqYbYsQHKfwZ|XJW$LFQCs?gSj
z#M;FT)gd(VKIKg4wnbX`5#GZOp@9e<!>A_H!ANgH=;jpHiMS<|UvYC96%z9?Nfa|V
zsrzXuE5Sf3lX(^uNeaFHIf8iwm|fI1Y9l~bIisL<HE*Yu6n80vEJu<Qhh@5#foZ0Z
zu>>Ox#uH4Y8T`#kj#73}BPmOU(TQOWDlm~w!E7>;isYCIn>(xU&ro{WRB+{3`97}f
zt|%XUmW^UQV<H;SGmu(1ixFiZ>~x%GsP055nMsSdB__?JUxxP_$x|c*`(?mG|GpQD
zZJ4)+cVk1IyT+w{w;h|8B7b`uMO&RdGP`}RE!2zgX=uo#W)P*tr==E#gRK!c`Cj;L
zJToN<KbDSQ8D)#h6G|CZ^Cs!GDs_5wQHgp{Gsx6K%;s7;Dk0~BbU+5wzfix!DR7Yz
z1pia&NcQ$8G%+}uDGz6j5LdK%9b9%t9$Sj%9Ov84CiRvLWXa(_rFt{;AsZ<Ko%)P0
zc{}KB;Xn^@j0HH*!@>5p|4^7g?}5kpPpD(M_>t4(k`9{4ilWyAJ97Bp`~l_5+#{Fm
zzUSh0{UKG5B$D85WEYIp>tm`hE7#ri9!6d_1m%XJoR-iy5Xh&8v<c+wh3a!MEJQW$
zNIE~&?5Ie0E441BLX?kD?IMxH_wb^a1=WDRwV+lqYv2V~2-0S-XVupbvMi}J+)347
z8O-Sw$Sr8`g=q@;8q%w)xX_mOcX-@GXLVz9b2EKYH|uA44P~O_(!Ij~vvWnob;%*k
z?uKpGWxbZ`axx>*8|BmV_9|7gyR69(zvY~Yq<u!$4Kf1DDbSUgYh-l@9bU9F+&F>_
ziZHf%y?~QWaElV!75)h&v^EnwD_3rg%1TIx_e1I%OJ>ZM7N41aasFHL=jRul7jQB4
zrKK9`!k3k|m9H$d@>S(!S*JeBe?j#xA`vDq(%;X9PumsvTj_`_+}Z%OTqjvM+wtgV
l2Al%E^599AfrfL^I7Q(~x|VNYgO!lh*U0GqIXVQi{{_={8O#6x

literal 0
HcmV?d00001

diff --git a/src/model/__pycache__/yolo_detector.cpython-39.pyc b/src/model/__pycache__/yolo_detector.cpython-39.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..a67f54a06b6400e5a637a096bd6ebf4e3efd2097
GIT binary patch
literal 7104
zcmbtZOOG7ab*^_+S3l>$;mnYx%Z?JT6>B6h4?7crro@LOgBdd9D74yRw`=-V_f)gG
zx_PUboas~xK`1S<FrchO0W(Noz}qbH6Ou(XfssW}s{mO9Tzf|cQoeJmy1IuP7y(>8
zb?UzFJ?Gx@opaB))v7Jwx%BJ5KluHoB>gvK79SOv>v*F+2$Nb8lbI68Em?e(mWr<$
zXal{a%T%WY#=vZu1FK~XO0CksZrOu!t1Rl2pwg<KjUH47wN@=JtGDVukeI>DPbFqP
zQ(6tCJdm2!<cj_A-8*-kn_ld7;vsjsct5=9+;BO|3;ki}xFK_H@Zo6WhduiR)+p^X
z<y5=p#s^J3)$aIFoa(#dQQ)Q4-BFA#Zjfp>{Z5>!?}bOymZs@Y&&9_?<~rW!A3;0`
z{7Nl_$>8^#r+NB@<QYtRt}vY$pXx2sv%HdLd%9QdDjU)UI6<AoN}p=rcumw+(MR(v
z&?>&QejTmK&vjN|RgBPJ=h4dYmgb|d`g4sn*b-`&+4^g>%cxyptEgQO65B{C#K}xv
zlk2vFhl<|XcO#EE>=j9NNRnCMOp=|MB&qAp|A2Ko|MmT*lG=kI^MdvWa!u{dFzouw
z3p-wi&d2Pbw1)Qv-so>Z5+#w^QY;@Uv3epSttB$Q9_xwxOg=VFB&1DBqsB_4zII$<
zaw2~reW{$tvJ|exCR0w;ViZ}5?SA>Vg5Hd2A$9=0t9fq&-|DPCGsQXjCm{!7=)=&D
zeK+tYo)AkRkfK46c#rp@?IK5g=j?Agbhw;&m<=K-oUR{u&gHF9+&tB5E~stiMj<pO
zKHy$-FbtSD)WsGQT_>0B3|)pT>x`p#I5;&CM}A@-4TIs6?}eCf^39JToPB4+y|-fS
z`XRc}rlU4nbgFg6%uUtKXgsN9ZJGDP?|9qJPP4`<*r(JChP@s}NlQI1zJs*KQ>)z$
z-GSF`rv}w}oGaAS@D8C<5w|F#3+_|R54*!uhn98@coh|`iXXMzC$1m3`_Mcio3N>-
zTI2;?UPco!@h>I5f%MBixv{<XQRMMxFYJwvyuF)V^e7&V_U_)ezZdb&o|tBjm~PKb
z@z&^wmgr+o+wCO`5-o#BmLXTvhHT5Ls*TjDJUO?h6<f0&bfo=(+w-y`ZE!Ch^RPoK
z&K??+z)>7$CQH)i@?<lXj^$XPLwh1ml?0G5miQGMJM~y&D4!j^p7c<9Afa3*CFmPW
z{kbw#d(u=()SJ>zo=^2e@0(L2F))J6f0!63{d8(3X5V7khICvyk&f*XX-}J4)6&$Q
zmg6$&DpdDOo>t;2a<x21$6xQ)6F|(gh8pXc3|bP@7PS0K?rBLSsV23=PONn)DJP|M
zX;otSbA4J*wBtrnC*^wlv&TP7wEj{K$bhh)D>Ct+9xpRHUP-iP;E|ORxxWftHR_XS
z#H%L7=RTK@ekx1ThAd4ki#{5wkW5%LY0O%aWDMzJ7>jA+lg5Mm`;PPuQc&31<X;Ot
zxG4~eP@k|Wa(u#jM{HZsrbxW5v-AC(>#Qgf>RNOp^)52^#W{FI`N@hn!|noDLVw3W
z963*YK*9cS95T|u{o$b(6+`X3T)QzGL&?Ko>;zEgY~|Yy8683fjx!~ZmD)$gOcAY4
z;6_o~X8>7|A{9(EmwRr9TF)Lz6Wl()8#O=@NN<BE%ukmLsJbIY<iCeXp=6j<J`|~p
zY@#Byt_JR4pSjoWBll~((q!wDzGUi#1+~Q%Y+Vh89XE)sA(3_5g(j(wyrb0Q-V<oB
zH!*ILJe)~=E-$fllZ&@FhY`>54)R*u*p~_fvj&)YawRqV0T^bf8pWKGTBkbTXUO>~
z(wU%iA?ucQcyxHgYobXw9sm>cE<_#kZ&H!!hcNS<AWC(TW0V^1Xyk<qFf`;bKPTD*
zUYKe^%%xk09Z&cO%_Y80Q(Y7Ti!(#~i9Jv4oPlA80kcBBC5FP9Qswa7R5`+Xcm>}p
z*(Q982KzR(DHWYl*?V<2>aR!}4w)2v4@9yxr6ybQvTUdgMMKKKYbl#@4Zn)IDJ$Yv
z`;B4N)Me$8Y$y$RU7lS0ZJYUm(5<NpF1dqrS{{z$(Kya9(Hyyqjy3-VsyaHz>>+s<
z$he8KIQfrLxCm?$xcE+v0SmbJP-r=@4=tGb8BXh-GBtpE$^z2CwMwi+TbG_GQ!A!i
zDbJPQFql9v?L5`l$QeMgELTo+v@3t6ps)RzLXOz9lBoRO6SZ&kOK{cTtPz@Ftu`=R
zg=<kcnW0;mnTa|>@1&9=S_O!<3Ph^{(f%Ok#uA8DO32X=`1deFv+5^RLNMSOQU#vb
zZW{tBK!JSK*|~SRWXv-}8Ve)7h$KaqBJux3xDY$|3P=*f5y)&i?=N7L^W(#JzvCR?
zJ-mYNm7f$dQTv6XFo(~`ed0O7ON5&tR(`5aeqyM-I698Y1s22y-YJwk)v3swiM_(P
zpH1etkt5U`19SJN=()o$;Yhw9>n%Wa_m@hF<IBA;j#5i_EbZZ=$@vFZKD;XOa*HA1
z$jy*RR1lEoz?5weCpBzV`I|KQ9}@Wv5yB<@7D%c`2kyvA)q#5m;)kh`O%3<x5%YO!
z`h%z3k39i6ob(xfSAj1=^Z0EV?FU5ujD|E0Jim8<tIJcL!CSmW72hXvoydD2shP9E
z$v=4&Nh(x1L+u}<L39~Jsw*=XQI-K41RnUQtEwh9@LN`L*w{D)8;fJzZfY4S+WGk)
z2CH-|+C%QchjfDsFX$pLd&oc)c=4Z5hgc#HswefJElhc?O*Qydf0MwsO31GQeni)x
zZOXCARCpR%p_jtbzy(5oCc|F}a_lh451K+R`^FS{4xh?6FTv|Dzf`9-{IAj%Qex8>
z7o=$!v*6MJj3}R|z=sO6;D6mtG**JwWhG|j(J-5GSSLIuDtUZ6Q9qY?H_?g4B_N34
z0jsShI@Z!9-z{4QYRmAnELMg^wwOT{8Q+S?!AI*Vti~!QxG<w7`D7-e%V6URpx(R>
zTUtlUxYVz*WzpWmDt-lSz$JKF5!}=;LJcda0n4g{WqDd-t5+p<4qUBWCGSl+uCw!*
zB-wi0Ksopmp4`TlI`Q{V3a`O~TLRww3V2rs-n}9EEwfF5ck4<06y90W`X}|!X5vd|
zmuT=hF1U9V(e54}cDyKZT!-KdS0n)$+qnxMF7I@>X8JbwoeItV-7s%{Mz@{2!n8R!
zuOgmsB<^0h4rS|_Pfz%F>P&At4-Y(`7^i!m0KwU5&$|9rN03G<7&;T=ayb$7<X%S6
z9tzj8eZq8MmHD4Tm(ps!Zc!AaW;E`QoG0r$!$Ow1kO}8PM}SPr5KdhC1-3|fscrQ~
zy&W+g{}BoVaPkk3dO@CLQxyd-zAmchrZ`czu5|e=DkFuS)Y@(c_tuR)M#H7GA}f}*
z%Ri=8cFrHxBEWP~%N_chjmc8x8IH2!LSksHWGH)+rV=io`PAhhs`z(Nl$Jc$0gq#1
zICHT#;2%-LKPFP(bXuaVcIn{38jRyz?=VhRZ{OY7ZGUj<{(}#0ecXQV;a}XlbL&U^
zFR3H>gZxj45Jn4ZZ#EWy`md<;A(5*@#7@XQf1ffA5f>yiqH(wDA7+TYOT~of{HH|D
zg6h?r>vpChZJ{E6ht?78g;X;#-|l}6Q&VjCeyijI%9d&nWUDpB0)(%s6;ODD@|!4K
zlZ~$ojR3uZ+RN|+x0K1ZPC@!vb2hcKlpQqa2q$LKnoxpbPhUrNy6l(m5@XT7;9Mn2
zpD-P$PM+3*#MFO~ryB0P2>Ki&Ja|I5{RZ88j}?S)-bf6(IiCPMo={Fd26_v;MLG(A
zK*q5NM5jBX@udj=Fp~mn&vC~QwH9urC9(%-fm^9)ClD<wMR*NA*qJKsxn^wVmgApc
zIdHF@jR4%O35!uL#%d&`ei?`-R+A7;lVu`nV)v`Uj+7TUg;lAM_nD}|s+epE_Ctq%
zDdT=zVapp5{{?V<MW^6k?Yp?V0hdj-N_os#Vdn^si}JOi{QSK9@h|fAu8UDgHWu5!
zD4QFwc3IFYZ*hU<dad*#&G=gBH&D8^P)cF5OYZ$MaXbies1$ec1u&&JY&71Vp{u`e
z4=$kW3@jJ8hECfE&XL<X>wo0nf*d27MOYv-;xst_&cI%r>DQ6Hs5)!nf|)aM{Czj>
z93T`Ytln8@zRN#^rd*@T6eqWAqHT@B-bCMu{cabT{lN&C{>ba4@|%+tz<I_zj1}Ff
zf#j1FVKz_8`u3#$O4FtypjUv{q<n9_qDi$Fl5QUY<Pn3Y#6a;N1D_~u<SclsD9P%J
z+iR3ovyvRb`8KiC0(mLFEkHgiA^hh7kpU6HOdb*;lQX&Sn!q~40b=zqC)<-{$9c=y
zrDf$S-gfvS>Q$$ToFz1LCTsJS^97=OWnP{y6ETK5zlT9mo%e#_K78}2O~G5<6@|g@
zDIyKRj1>O;f?fC-8fEsU%)P*keYm}ddfuht9tds;!mmG|0%0zEq|%1i#5T;27e<J+
zM`<}Lp_!w!M4!yM3n_ZkTZA5}#VizfZ&mYSpKX3-g*K?MAR?es-KQhi&iC)%P#KYZ
zl4>>8k~MhzYcL9AL~P{}Oh^_sP<~^S8uDdCOl`S_8v+>>3Lk93tgK}}WwLq7fSj79
zsq6@MfWG7#H09g$x5_Dmn%eC);<sb4*iI|$_T#Y|<bh?g-Dbm1yUm3@h+EY==)o@#
z5tljgM7TkO{vpGKH}Eb}sS=J-Gi2f#C~QBXXv1M3c7Y#K+qqy0>2NYt<i<qb27x@Z
zwe^dCB+1fOHUcX4SCzM=uMt1~x^g4?iuQ;F{WXmz+={m;m4MLoGCm0W{X8ljAJKoH
zxL7Y;eKMBjE3c!hRYuH^yTMWHcd`IFU!$h9s<W1h=v*eaYvizrFrS89wB(9>QBX_y
EKQ$^5T>t<8

literal 0
HcmV?d00001

diff --git a/src/model/id_card_processor.py b/src/model/id_card_processor.py
new file mode 100644
index 0000000..710f0cf
--- /dev/null
+++ b/src/model/id_card_processor.py
@@ -0,0 +1,343 @@
+"""
+ID Card Processor for background removal and preprocessing
+"""
+import cv2
+import numpy as np
+from pathlib import Path
+from typing import List, Optional, Dict, Any, Tuple
+import logging
+from .yolo_detector import YOLODetector
+
+class IDCardProcessor:
+    """
+    ID Card Processor for background removal and preprocessing
+    """
+    
+    def __init__(self, yolo_detector: Optional[YOLODetector] = None):
+        """
+        Set up the processor with a detector and a logger named after this module.
+
+        Args:
+            yolo_detector: Detector to reuse; a default YOLODetector is built if falsy
+        """
+        self.logger = logging.getLogger(__name__)
+        self.yolo_detector = yolo_detector if yolo_detector else YOLODetector()
+    
+    def remove_background(self, image: np.ndarray, method: str = 'grabcut') -> np.ndarray:
+        """
+        Strip the background from an image with the selected strategy.
+
+        Args:
+            image: Input image
+            method: One of 'grabcut', 'threshold' or 'contour'; any other
+                value logs a warning and falls back to 'grabcut'
+
+        Returns:
+            Image with background removed
+        """
+        strategies = {
+            'grabcut': self._grabcut_background_removal,
+            'threshold': self._threshold_background_removal,
+            'contour': self._contour_background_removal,
+        }
+        if method not in strategies:
+            self.logger.warning(f"Unknown method: {method}, using grabcut")
+        return strategies.get(method, self._grabcut_background_removal)(image)
+    
+    def _grabcut_background_removal(self, image: np.ndarray) -> np.ndarray:
+        """
+        Black out the background using GrabCut seeded with a centred rectangle.
+
+        The seed rectangle starts 1/8 in from the top-left corner and spans 3/4
+        of the width and height. On any error the input image is returned as is.
+        """
+        try:
+            rows, cols = image.shape[:2]
+
+            # Label map that GrabCut fills in place
+            labels = np.zeros((rows, cols), np.uint8)
+
+            # Scratch model buffers required by the OpenCV call
+            background_model = np.zeros((1, 65), np.float64)
+            foreground_model = np.zeros((1, 65), np.float64)
+
+            # Seed rectangle (x, y, w, h); assumes the card is roughly centred
+            seed_rect = (cols//8, rows//8, cols*3//4, rows*3//4)
+            cv2.grabCut(image, labels, seed_rect, background_model, foreground_model,
+                        5, cv2.GC_INIT_WITH_RECT)
+
+            # Labels 0 and 2 are zeroed out; every other label is kept
+            keep = np.where((labels == 2) | (labels == 0), 0, 1).astype('uint8')
+
+            # Add a trailing axis so the mask broadcasts against the image
+            return image * keep[:, :, np.newaxis]
+        except Exception as e:
+            self.logger.error(f"Error in grabcut background removal: {e}")
+            return image
+    
+    def _threshold_background_removal(self, image: np.ndarray) -> np.ndarray:
+        """
+        Keep only the largest Otsu-thresholded region and black out the rest.
+
+        The image is returned unchanged when no contour is found or on error.
+        """
+        try:
+            # Smooth a grayscale copy before thresholding
+            gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
+            smoothed = cv2.GaussianBlur(gray, (5, 5), 0)
+
+            # With THRESH_OTSU the threshold is computed, so the 0 is a placeholder
+            _, binary = cv2.threshold(
+                smoothed, 0, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU
+            )
+
+            # Outer contours of the regions above the threshold
+            outlines, _ = cv2.findContours(
+                binary, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE
+            )
+            if not outlines:
+                return image
+
+            # The biggest region is assumed to be the ID card
+            card_outline = max(outlines, key=cv2.contourArea)
+
+            # Filled silhouette of that region, used as a pixel mask
+            card_mask = np.zeros_like(gray)
+            cv2.fillPoly(card_mask, [card_outline], 255)
+
+            return cv2.bitwise_and(image, image, mask=card_mask)
+        except Exception as e:
+            self.logger.error(f"Error in threshold background removal: {e}")
+            return image
+    
+    def _contour_background_removal(self, image: np.ndarray) -> np.ndarray:
+        """
+        Mask the image with a simplified polygon around its largest edge contour.
+
+        The image is returned unchanged when no contour is found or on error.
+        """
+        try:
+            # Canny edges on a grayscale copy
+            gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
+            edge_map = cv2.Canny(gray, 50, 150)
+
+            # Outer contours traced along those edges
+            outlines, _ = cv2.findContours(
+                edge_map, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE
+            )
+            if not outlines:
+                return image
+
+            # Pick the contour enclosing the most area
+            biggest = max(outlines, key=cv2.contourArea)
+
+            # Simplify it with a tolerance of 2% of its perimeter
+            tolerance = 0.02 * cv2.arcLength(biggest, True)
+            polygon = cv2.approxPolyDP(biggest, tolerance, True)
+
+            # Fill the polygon to obtain the pixel mask
+            polygon_mask = np.zeros_like(gray)
+            cv2.fillPoly(polygon_mask, [polygon], 255)
+
+            # Pixels outside the polygon become black
+            return cv2.bitwise_and(image, image, mask=polygon_mask)
+
+        except Exception as e:
+            self.logger.error(f"Error in contour background removal: {e}")
+            return image
+    
+    def enhance_image(self, image: np.ndarray) -> np.ndarray:
+        """
+        Boost local contrast with CLAHE, then lightly blur to reduce noise.
+
+        Assumes a BGR input, since it is converted with COLOR_BGR2LAB. The input
+        image is returned unchanged if any step fails.
+        """
+        try:
+            # Work in LAB so that only channel 0 (L) is equalized
+            lab_image = cv2.cvtColor(image, cv2.COLOR_BGR2LAB)
+
+            # Contrast-limited adaptive histogram equalization on the L channel
+            equalizer = cv2.createCLAHE(clipLimit=2.0, tileGridSize=(8, 8))
+            lightness = lab_image[:, :, 0]
+            lab_image[:, :, 0] = equalizer.apply(lightness)
+
+            # Back to BGR, followed by a 3x3 Gaussian blur
+            contrast_boosted = cv2.cvtColor(lab_image, cv2.COLOR_LAB2BGR)
+            return cv2.GaussianBlur(contrast_boosted, (3, 3), 0)
+
+        except Exception as e:
+            self.logger.error(f"Error enhancing image: {e}")
+            return image
+    
+    def normalize_image(self, image: np.ndarray, target_size: Tuple[int, int] = (800, 600)) -> np.ndarray:
+        """
+        Resize the image and equalize its grayscale histogram.
+
+        Args:
+            image: Input image (2-D grayscale, or with a channel axis and treated as BGR)
+            target_size: Size handed to cv2.resize as dsize
+
+        Returns:
+            Equalized image; inputs with a channel axis come back as gray values
+            converted to BGR. The input is returned unchanged on error.
+        """
+        try:
+            scaled = cv2.resize(image, target_size, interpolation=cv2.INTER_AREA)
+
+            # Histogram equalization is applied to a single-channel image
+            has_channels = len(scaled.shape) == 3
+            gray = cv2.cvtColor(scaled, cv2.COLOR_BGR2GRAY) if has_channels else scaled
+            equalized = cv2.equalizeHist(gray)
+
+            # Restore a BGR layout when the caller passed a 3-D array
+            if len(image.shape) == 3:
+                return cv2.cvtColor(equalized, cv2.COLOR_GRAY2BGR)
+            return equalized
+
+        except Exception as e:
+            self.logger.error(f"Error normalizing image: {e}")
+            return image
+    
+    def process_id_card(self, image_path: Path, output_dir: Path,
+                       remove_bg: bool = True, enhance: bool = True,
+                       normalize: bool = True, target_size: Tuple[int, int] = (800, 600)) -> Dict[str, Any]:
+        """
+        Run the enabled preprocessing steps on one image and save the result.
+
+        Args:
+            image_path: Path to input image
+            output_dir: Output directory (created if missing)
+            remove_bg: Whether to remove background (remove_background default method)
+            enhance: Whether to enhance image
+            normalize: Whether to normalize image
+            target_size: Target size for normalization
+
+        Returns:
+            Dict with 'input_path', 'output_paths' and 'success'. The file is saved
+            as '<stem>_processed.jpg'; 'success' is True only when it was actually
+            written. Load, processing and write failures are logged, not raised.
+        """
+        result = {
+            'input_path': str(image_path),
+            'output_paths': [],
+            'success': False
+        }
+
+        try:
+            # cv2.imread signals an unreadable file by returning None
+            image = cv2.imread(str(image_path))
+            if image is None:
+                self.logger.error(f"Could not load image: {image_path}")
+                return result
+
+            processed_path = output_dir / f"{image_path.stem}_processed.jpg"
+
+            # Work on a copy so the loaded array itself is never modified
+            processed_image = image.copy()
+
+            if remove_bg:
+                self.logger.info(f"Removing background from {image_path.name}")
+                processed_image = self.remove_background(processed_image)
+
+            if enhance:
+                self.logger.info(f"Enhancing {image_path.name}")
+                processed_image = self.enhance_image(processed_image)
+
+            if normalize:
+                self.logger.info(f"Normalizing {image_path.name}")
+                processed_image = self.normalize_image(processed_image, target_size)
+
+            # cv2.imwrite can fail by returning False, so check before reporting success
+            processed_path.parent.mkdir(parents=True, exist_ok=True)
+            if not cv2.imwrite(str(processed_path), processed_image):
+                self.logger.error(f"Could not write image: {processed_path}")
+                return result
+            result['output_paths'].append(str(processed_path))
+            result['success'] = True
+            self.logger.info(f"Processed {image_path.name}")
+        except Exception as e:
+            self.logger.error(f"Error processing {image_path}: {e}")
+
+        return result
+    
+    def batch_process_id_cards(self, input_dir: Path, output_dir: Path,
+                              detect_first: bool = True, **kwargs) -> Dict[str, Any]:
+        """
+        Process all ID card images in a directory
+
+        Args:
+            input_dir: Input directory
+            output_dir: Output root; crops go to 'cropped', results to 'processed'
+            detect_first: Whether to detect and crop ID cards with YOLO first
+            **kwargs: Forwarded to process_id_card for every image
+
+        Returns:
+            Batch processing results from _process_cropped_images
+        """
+        output_dir.mkdir(parents=True, exist_ok=True)
+        processed_dir = output_dir / "processed"
+
+        if not detect_first:
+            # Process original images directly
+            return self._process_cropped_images(input_dir, processed_dir, **kwargs)
+
+        self.logger.info("Detecting and cropping ID cards...")
+        cropped_dir = output_dir / "cropped"
+        detection_results = self.yolo_detector.batch_process(input_dir, cropped_dir)
+
+        # The detector always creates cropped_dir, so its existence says nothing;
+        # rely on the number of crops it reports to decide whether to fall back.
+        if detection_results.get('total_cropped', 0) > 0:
+            self.logger.info("Processing cropped ID cards...")
+            return self._process_cropped_images(cropped_dir, processed_dir, **kwargs)
+
+        self.logger.warning("No cropped images found, processing original images")
+        return self._process_cropped_images(input_dir, processed_dir, **kwargs)
+    
+    def _process_cropped_images(self, input_dir: Path, output_dir: Path, **kwargs) -> Dict[str, Any]:
+        """
+        Run process_id_card on every image below input_dir, mirroring its layout.
+
+        Args:
+            input_dir: Directory searched recursively for images
+            output_dir: Root under which the input sub-folder structure is recreated
+            **kwargs: Passed through to process_id_card
+
+        Returns:
+            Dict with 'total_images', 'processed_images' and per-image 'results',
+            or {'success': False, 'error': ...} when no image is found
+        """
+        image_extensions = {'.jpg', '.jpeg', '.png', '.bmp', '.tiff'}
+
+        # Collect files whose lower-cased suffix is a known image extension
+        image_files = [
+            candidate for candidate in input_dir.rglob('*')
+            if candidate.is_file() and candidate.suffix.lower() in image_extensions
+        ]
+
+        if not image_files:
+            self.logger.error(f"No images found in {input_dir} and subdirectories")
+            return {'success': False, 'error': 'No images found'}
+
+        total = len(image_files)
+        self.logger.info(f"Processing {total} images from {input_dir} and subdirectories")
+
+        results = {'total_images': total, 'processed_images': 0, 'results': []}
+
+        for position, image_path in enumerate(image_files, start=1):
+            self.logger.info(f"Processing {position}/{total}: {image_path.name}")
+
+            # Recreate the image's parent folder (relative to input_dir) in the output
+            output_subdir = output_dir / image_path.relative_to(input_dir).parent
+            output_subdir.mkdir(parents=True, exist_ok=True)
+
+            outcome = self.process_id_card(image_path, output_subdir, **kwargs)
+            results['results'].append(outcome)
+            if outcome['success']:
+                results['processed_images'] += 1
+
+        self.logger.info(f"ID card processing completed:")
+        self.logger.info(f"  - Total images: {results['total_images']}")
+        self.logger.info(f"  - Processed: {results['processed_images']}")
+        return results
\ No newline at end of file
diff --git a/src/model/yolo_detector.py b/src/model/yolo_detector.py
new file mode 100644
index 0000000..b1974bf
--- /dev/null
+++ b/src/model/yolo_detector.py
@@ -0,0 +1,266 @@
+"""
+YOLO Detector for ID Card Detection and Cropping
+"""
+import cv2
+import numpy as np
+from pathlib import Path
+from typing import List, Tuple, Optional, Dict, Any
+import logging
+from ultralytics import YOLO
+import torch
+
+class YOLODetector:
+    """
+    YOLO-based detector for ID card detection and cropping
+    """
+    
+    def __init__(self, model_path: Optional[str] = None, confidence: float = 0.5):
+        """
+        Initialize YOLO detector
+
+        Args:
+            model_path: Path to YOLO model file (.pt); the stock 'yolov8n.pt'
+                weights are used when it is omitted or does not exist
+            confidence: Confidence threshold for detection
+        """
+        self.confidence = confidence
+        self.logger = logging.getLogger(__name__)
+        if model_path and Path(model_path).exists():
+            self.model = YOLO(model_path)
+            self.logger.info(f"Loaded custom YOLO model from {model_path}")
+        else:
+            if model_path:
+                # Make the fallback visible instead of silently swapping models
+                self.logger.warning(f"Model file not found: {model_path}")
+            self.model = YOLO('yolov8n.pt')
+            self.logger.info("Using pre-trained YOLOv8n model")
+
+        self.device = 'cuda' if torch.cuda.is_available() else 'cpu'
+        self.logger.info(f"Using device: {self.device}")
+    
+    def detect_id_cards(self, image_path: Path) -> List[Dict[str, Any]]:
+        """
+        Run the YOLO model on an image and list every detection it reports.
+
+        No class filtering is applied here: every box the model returns for
+        the configured confidence threshold is included, whatever its class.
+
+        Args:
+            image_path: Path to image file
+
+        Returns:
+            Detections sorted by descending (confidence, area). Each is a dict
+            with 'bbox' ([x1, y1, x2, y2] ints), 'confidence', 'class_id',
+            'class_name' and 'area', all plain Python values. An empty list is
+            returned when the image cannot be read or detection fails.
+        """
+        try:
+            # cv2.imread returns None instead of raising on unreadable files
+            image = cv2.imread(str(image_path))
+            if image is None:
+                self.logger.error(f"Could not load image: {image_path}")
+                return []
+
+            results = self.model(image, conf=self.confidence)
+
+            detections = []
+            for result in results:
+                if result.boxes is None:
+                    continue
+                for box in result.boxes:
+                    x1, y1, x2, y2 = box.xyxy[0].cpu().numpy()
+                    class_id = int(box.cls[0])
+                    detections.append({
+                        'bbox': [int(x1), int(y1), int(x2), int(y2)],
+                        'confidence': float(box.conf[0]),
+                        'class_id': class_id,
+                        'class_name': self.model.names[class_id],
+                        # Cast the NumPy scalar so every field is a native type
+                        'area': float((x2 - x1) * (y2 - y1)),
+                    })
+
+            # Most confident first; area only breaks ties in confidence
+            detections.sort(key=lambda d: (d['confidence'], d['area']), reverse=True)
+
+            self.logger.info(f"Found {len(detections)} detections in {image_path.name}")
+            return detections
+        except Exception as e:
+            self.logger.error(f"Error detecting ID cards in {image_path}: {e}")
+            return []
+    
+    def crop_id_card(self, image_path: Path, bbox: List[int],
+                    output_path: Optional[Path] = None,
+                    padding: int = 10) -> Optional[np.ndarray]:
+        """
+        Crop a padded bounding box out of an image and optionally save it.
+
+        Args:
+            image_path: Path to input image
+            bbox: Bounding box [x1, y1, x2, y2] in pixel coordinates
+            output_path: Where to save the crop; parent folders are created
+            padding: Pixels added on every side, clamped to the image bounds
+
+        Returns:
+            Cropped image as numpy array, or None when the image cannot be
+            read, the clamped box is empty, or the crop cannot be saved
+        """
+        try:
+            image = cv2.imread(str(image_path))
+            if image is None:
+                self.logger.error(f"Could not load image: {image_path}")
+                return None
+
+            height, width = image.shape[:2]
+            x1, y1, x2, y2 = bbox
+
+            # Grow the box by the padding without leaving the image
+            x1, y1 = max(0, x1 - padding), max(0, y1 - padding)
+            x2, y2 = min(width, x2 + padding), min(height, y2 + padding)
+
+            cropped = image[y1:y2, x1:x2]
+            if cropped.size == 0:
+                self.logger.error(f"Empty crop {bbox} for {image_path}")
+                return None
+
+            if output_path:
+                output_path.parent.mkdir(parents=True, exist_ok=True)
+                # imwrite can signal failure by returning False without raising
+                if not cv2.imwrite(str(output_path), cropped):
+                    self.logger.error(f"Could not write image: {output_path}")
+                    return None
+                self.logger.info(f"Saved cropped image to {output_path}")
+            return cropped
+        except Exception as e:
+            self.logger.error(f"Error cropping ID card from {image_path}: {e}")
+            return None
+    
+    def process_single_image(self, image_path: Path, output_dir: Path,
+                           save_original: bool = False) -> Dict[str, Any]:
+        """
+        Detect objects in one image and save a crop for each detection.
+
+        Crops are named '<stem>_card_<n>.jpg', numbered from 1 in detection order.
+
+        Args:
+            image_path: Path to input image
+            output_dir: Output directory for cropped images
+            save_original: Also save '<stem>_annotated.jpg' with the boxes drawn
+
+        Returns:
+            Dict with 'input_path', 'detections', 'cropped_paths', 'success' and,
+            when save_original is set, 'annotated_path'. 'success' stays False
+            when nothing is detected or an exception occurs.
+        """
+        result = {
+            'input_path': str(image_path),
+            'detections': [],
+            'cropped_paths': [],
+            'success': False
+        }
+
+        try:
+            detections = self.detect_id_cards(image_path)
+
+            # Nothing to crop: report failure for this image
+            if not detections:
+                self.logger.warning(f"No ID cards detected in {image_path.name}")
+                return result
+
+            stem = image_path.stem
+            for index, detection in enumerate(detections, start=1):
+                output_path = output_dir / f"{stem}_card_{index}.jpg"
+
+                # Only detections whose crop succeeded are recorded
+                cropped = self.crop_id_card(image_path, detection['bbox'], output_path)
+                if cropped is None:
+                    continue
+                result['detections'].append(detection)
+                result['cropped_paths'].append(str(output_path))
+
+            if save_original:
+                # Draw every box and its confidence on a freshly loaded copy
+                image = cv2.imread(str(image_path))
+                green = (0, 255, 0)
+                for detection in detections:
+                    corners = detection['bbox']
+                    cv2.rectangle(image, (corners[0], corners[1]), (corners[2], corners[3]), green, 2)
+                    cv2.putText(image, f"{detection['confidence']:.2f}",
+                                (corners[0], corners[1] - 10), cv2.FONT_HERSHEY_SIMPLEX,
+                                0.5, green, 2)
+
+                annotated_path = output_dir / f"{image_path.stem}_annotated.jpg"
+                cv2.imwrite(str(annotated_path), image)
+                result['annotated_path'] = str(annotated_path)
+
+            result['success'] = True
+            self.logger.info(f"Processed {image_path.name}: {len(result['cropped_paths'])} cards cropped")
+
+        except Exception as e:
+            self.logger.error(f"Error processing {image_path}: {e}")
+
+        return result
+    
+    def batch_process(self, input_dir: Path, output_dir: Path,
+                     save_annotated: bool = False) -> Dict[str, Any]:
+        """
+        Detect and crop every image found under a directory tree.
+
+        The sub-folder layout of input_dir is mirrored below output_dir.
+
+        Args:
+            input_dir: Input directory containing images (searched recursively)
+            output_dir: Output directory for cropped images (created if missing)
+            save_annotated: Whether to save annotated images
+
+        Returns:
+            Dict with 'total_images', 'processed_images', 'total_detections',
+            'total_cropped' and per-image 'results', or
+            {'success': False, 'error': ...} when no image is found
+        """
+        output_dir.mkdir(parents=True, exist_ok=True)
+        image_extensions = {'.jpg', '.jpeg', '.png', '.bmp', '.tiff'}
+
+        # Keep regular files whose lower-cased suffix is a known image extension
+        image_files = [
+            candidate for candidate in input_dir.rglob('*')
+            if candidate.is_file() and candidate.suffix.lower() in image_extensions
+        ]
+
+        if not image_files:
+            self.logger.error(f"No images found in {input_dir} and subdirectories")
+            return {'success': False, 'error': 'No images found'}
+
+        total = len(image_files)
+        self.logger.info(f"Processing {total} images from {input_dir} and subdirectories")
+
+        results = {
+            'total_images': total,
+            'processed_images': 0,
+            'total_detections': 0,
+            'total_cropped': 0,
+            'results': []
+        }
+
+        for position, image_path in enumerate(image_files, start=1):
+            self.logger.info(f"Processing {position}/{total}: {image_path.name}")
+
+            # Recreate the image's parent folder (relative to input_dir) in the output
+            output_subdir = output_dir / image_path.relative_to(input_dir).parent
+            output_subdir.mkdir(parents=True, exist_ok=True)
+
+            outcome = self.process_single_image(image_path, output_subdir, save_annotated)
+            results['results'].append(outcome)
+
+            # Only successful images contribute to the counters
+            if not outcome['success']:
+                continue
+            results['processed_images'] += 1
+            results['total_detections'] += len(outcome['detections'])
+            results['total_cropped'] += len(outcome['cropped_paths'])
+
+        self.logger.info(f"Batch processing completed:")
+        self.logger.info(f"  - Total images: {results['total_images']}")
+        self.logger.info(f"  - Processed: {results['processed_images']}")
+        self.logger.info(f"  - Total detections: {results['total_detections']}")
+        self.logger.info(f"  - Total cropped: {results['total_cropped']}")
+        return results
\ No newline at end of file
diff --git a/src/utils.py b/src/utils.py
new file mode 100644
index 0000000..fa7f80a
--- /dev/null
+++ b/src/utils.py
@@ -0,0 +1,98 @@
+"""
+Utility functions for data augmentation
+"""
+import os
+import logging
+from pathlib import Path
+from typing import List, Tuple, Optional
+import cv2
+import numpy as np
+from PIL import Image
+
+def setup_logging(log_level: str = "INFO") -> logging.Logger:
+    """Configure root logging to a UTF-8 log file plus console; return this module's logger.
+
+    ``log_level`` names a ``logging`` level constant, case-insensitively (e.g. "debug").
+    """
+    logging.basicConfig(
+        level=getattr(logging, log_level.upper()),
+        format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
+        handlers=[logging.FileHandler('data_augmentation.log', encoding='utf-8'),
+                  logging.StreamHandler()])
+    return logging.getLogger(__name__)
+
+def get_image_files(directory: Path) -> List[Path]:
+    """Return the image files directly inside ``directory``, sorted by path.
+
+    Suffixes are matched case-insensitively, so names like ``a.Jpg`` are found and no
+    file is listed twice on case-insensitive filesystems. A missing or non-directory
+    path gives an empty list.
+    """
+    supported_formats = {'.jpg', '.jpeg', '.png', '.bmp', '.tiff'}
+    entries = directory.iterdir() if directory.is_dir() else ()
+    return sorted(p for p in entries if p.is_file() and p.suffix.lower() in supported_formats)
+
+def validate_image(image_path: Path) -> bool:
+    """Report whether Pillow can open and verify the file as an image."""
+    try:
+        with Image.open(image_path) as candidate:
+            candidate.verify()
+    except Exception:  # any failure to open or verify means "not a valid image"
+        return False
+    return True
+
+def load_image(image_path: Path, target_size: Tuple[int, int] = None) -> Optional[np.ndarray]:
+    """Read an image with OpenCV and return it as an RGB array, optionally resized.
+
+    Args:
+        image_path: File to read.
+        target_size: Output size handed to ``cv2.resize`` when truthy; no resize otherwise.
+
+    Returns:
+        The image, or ``None`` if OpenCV cannot read it or an error occurs (printed, not raised).
+    """
+    try:
+        bgr = cv2.imread(str(image_path))
+        if bgr is None:
+            return None
+        rgb = cv2.cvtColor(bgr, cv2.COLOR_BGR2RGB)  # OpenCV decodes in BGR channel order
+        return cv2.resize(rgb, target_size, interpolation=cv2.INTER_AREA) if target_size else rgb
+    except Exception as e:
+        print(f"Error loading image {image_path}: {e}")
+        return None
+
+def save_image(image: np.ndarray, output_path: Path, quality: int = 95) -> bool:
+    """Write an RGB image to ``output_path`` with OpenCV, creating parent directories.
+
+    ``quality`` is passed as ``cv2.IMWRITE_JPEG_QUALITY``. Returns ``True`` only if
+    ``cv2.imwrite`` reports success; failures and exceptions are printed and give ``False``.
+    """
+    try:
+        image_bgr = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)  # OpenCV writes BGR channel order
+        output_path.parent.mkdir(parents=True, exist_ok=True)
+        if not cv2.imwrite(str(output_path), image_bgr, [cv2.IMWRITE_JPEG_QUALITY, quality]):
+            raise OSError("cv2.imwrite reported failure")
+        return True
+    except Exception as e:
+        print(f"Error saving image {output_path}: {e}")
+        return False
+
+def create_augmented_filename(original_path: Path, index: int, suffix: str = "aug") -> Path:
+    """Build a sibling path named ``<stem>_<suffix>_<index>`` with the index zero-padded to 2 digits."""
+    tag = f"_{suffix}_{index:02d}"
+    new_name = f"{original_path.stem}{tag}{original_path.suffix}"
+    return original_path.parent / new_name
+
+def get_file_size_mb(file_path: Path) -> float:
+    """Return the size of ``file_path`` in units of 1024 * 1024 bytes."""
+    return os.path.getsize(file_path) / 1024 ** 2
+
+def print_progress(current: int, total: int, prefix: str = "Progress"):
+    """Redraw a one-line, 50-character progress bar on stdout, ending the line at completion."""
+    bar_length = 50
+    # A non-positive total means there is nothing to do: show a full bar, never divide by zero.
+    done = total <= 0
+    filled_length = bar_length if done else int(round(bar_length * current / float(total)))
+    percents = 100.0 if done else round(100.0 * current / float(total), 1)
+    bar = '=' * filled_length + '-' * (bar_length - filled_length)
+    print(f'\r{prefix}: [{bar}] {percents}% ({current}/{total})', end='\n' if current == total else '')
\ No newline at end of file