demo2

tien_nemo
Commit fec2e1e888ea619ea8b4c3d84f89bd1d332d4fdd fec2e1e8 1 parent 0a53c2c3
Showing 4 changed files with 149 additions and 36 deletions
app/Http/Controllers/OcrController.php
app/Services/OCR/extrac_table.py
app/Services/OCR/table_detector.py
resources/views/ocr/index.blade.php
--- a/app/Http/Controllers/OcrController.php
View file @fec2e1e
+++ b/app/Http/Controllers/OcrController.php
View file @fec2e1e
@@ -22,6 +22,7 @@ class OcrController extends Controller
             'customer_name_xy' => 'required|string',
         ]);
         $dataDetail = $request->fields ?? [];
+        $tableColumns = $request->table_columns ?? [];
         try {
             $masterTemplate = MstTemplate::updateOrCreate(
                 ['tpl_name' => $request->template_name],
@@ -49,6 +50,24 @@ class OcrController extends Controller
                 );
             }
+
+            // Lưu mapping cột bảng (lưu col index vào field_xy với field_name đặc biệt)
+            if (!empty($tableColumns) && is_array($tableColumns)) {
+                foreach ($tableColumns as $name => $colIdx) {
+                    if ($colIdx === null || $colIdx === '' || $colIdx === false) {
+                        continue;
+                    }
+                    DtTemplate::updateOrInsert(
+                        [
+                            'tpl_id'     => $masterTemplate->id,
+                            'field_name' => '__table_col__' . $name,
+                        ],
+                        [
+                            'field_xy' => (string) $colIdx,
+                        ]
+                    );
+                }
+            }
             return response()->json([
                 'success' => true,
                 'message' => 'Lưu template thành công',
@@ -70,8 +89,8 @@ class OcrController extends Controller
             $templateName = $request->get('template_name', '');
             // Giả sử file OCR JSON & ảnh nằm trong storage/app/public/image/
-            $jsonPath = public_path("image/3_1757295841_with_table.json");
+            $jsonPath = public_path("image/nemo_new_1757393338_with_table.json");
-            $imgPath = ("image/3_1757295841.jpg");
+            $imgPath = ("image/nemo_new_1757393338.jpg");
             if (!file_exists($jsonPath)) {
                 return response()->json(['error' => 'File OCR JSON không tìm thấy'], 404);
@@ -100,7 +119,13 @@ class OcrController extends Controller
                     // Lấy detail của template
                     $details = DtTemplate::where('tpl_id', $mst->id)->get();
+                    $tableColumnMapping = [];
                     foreach ($details as $detail) {
+                        if (strpos($detail->field_name, '__table_col__') === 0) {
+                            $name = substr($detail->field_name, strlen('__table_col__'));
+                            $tableColumnMapping[$name] = is_numeric($detail->field_xy) ? intval($detail->field_xy) : null;
+                            continue;
+                        }
                         $coords = array_map('intval', explode(',', $detail->field_xy));
                         // coords = [x1, y1, x2, y2]
@@ -130,6 +155,7 @@ class OcrController extends Controller
                 'pdfImageUrl' => $imgPath,
                 'dataMapping' => $dataMapping,
                 'is_template' => $is_template,
+                'tableColumnMapping' => $tableColumnMapping ?? [], //?? new \stdClass(),
                 'fieldOptions' => [
                     [ 'value' => 'template_name',  'label' => 'Tên Mẫu PDF' ],
                     [ 'value' => 'customer_name',  'label' => 'Tên khách hàng' ],
--- a/app/Services/OCR/extrac_table.py
View file @fec2e1e
+++ b/app/Services/OCR/extrac_table.py
View file @fec2e1e
@@ -11,14 +11,14 @@ from PIL import Image, ImageEnhance
 # ==== Config ====
 BASE_DIR = os.path.abspath(os.path.join(os.path.dirname(__file__), "..", "..", ".."))
-# PDF_NAME = 'aaaa'
+PDF_NAME = 'nemo_new'
 # PDF path
-pdf_path = Path(BASE_DIR) / "storage" / "pdf" / "3.pdf"
+pdf_path = Path(BASE_DIR) / "storage" / "pdf" / "2.pdf"
 # Output folder
 output_folder = Path(BASE_DIR) / "public" / "image"
-PDF_NAME = pdf_path.stem  # Get the stem of the PDF file
+# PDF_NAME = pdf_path.stem  # Get the stem of the PDF file
 #print(PDF_NAME)
 os.makedirs(output_folder, exist_ok=True)
@@ -151,9 +151,31 @@ for table in table_info:
             x1, y1, x2, y2 = cell["cell"]
             cell_texts = []
+            # Helper: compute overlap ratio of bbox against cell
+            def overlap_ratio(bbox, cell_box):
+                ix1 = max(bbox[0], cell_box[0])
+                iy1 = max(bbox[1], cell_box[1])
+                ix2 = min(bbox[2], cell_box[2])
+                iy2 = min(bbox[3], cell_box[3])
+                iw = max(0, ix2 - ix1)
+                ih = max(0, iy2 - iy1)
+                inter = iw * ih
+                bbox_area = max(1, (bbox[2] - bbox[0]) * (bbox[3] - bbox[1]))
+                return inter / float(bbox_area)
+
+            # Helper: check center inside cell
+            def center_inside(bbox, cell_box):
+                cx = (bbox[0] + bbox[2]) / 2.0
+                cy = (bbox[1] + bbox[3]) / 2.0
+                return (cx >= cell_box[0] and cx <= cell_box[2] and
+                        cy >= cell_box[1] and cy <= cell_box[3])
+
+            cell_box = [x1, y1, x2, y2]
             for item in ocr_data_list:
                 bx1, by1, bx2, by2 = item["bbox"]
-                if bx1 >= x1 and by1 >= y1 and bx2 <= x2 and by2 <= y2:
+                bbox = [bx1, by1, bx2, by2]
+                # Accept if bbox is largely inside the cell, or its center lies inside the cell
+                if overlap_ratio(bbox, cell_box) >= 0.3 or center_inside(bbox, cell_box):
                     cell_texts.append(item["text"])
             # thêm vào cell gốc
--- a/app/Services/OCR/table_detector.py
View file @fec2e1e
+++ b/app/Services/OCR/table_detector.py
View file @fec2e1e
@@ -2,46 +2,73 @@ import cv2
 import numpy as np
 import os
-def detect_tables(image_path):
+def filter_horizontal_lines(lines_h, img_width, min_h_len_ratio=0.8, tol_y=10):
+    if lines_h is None:
+        return [], []
+
+    ys_candidates = []
+    for l in lines_h:
+        x1, y1, x2, y2 = l[0]
+        if abs(y1 - y2) <= 3:  # ngang
+            line_len = abs(x2 - x1)
+            y_mid = int(round((y1 + y2) / 2))
+            ys_candidates.append((y_mid, line_len, x1, x2))
+
+    ys_candidates.sort(key=lambda x: x[0])
+    filtered_lines, line_segments, current_group = [], [], []
+
+    for y, length, x1, x2 in ys_candidates:
+        if not current_group:
+            current_group.append((y, length, x1, x2))
+        else:
+            if abs(y - current_group[-1][0]) <= tol_y:
+                current_group.append((y, length, x1, x2))
+            else:
+                longest = max(current_group, key=lambda x: x[1])
+                if longest[1] >= min_h_len_ratio * img_width:
+                    filtered_lines.append(longest[0])
+                    line_segments.append((longest[2], longest[3], longest[0]))
+                else:
+                    break
+                current_group = [(y, length, x1, x2)]
+
+    if current_group:
+        longest = max(current_group, key=lambda x: x[1])
+        if longest[1] >= min_h_len_ratio * img_width:
+            filtered_lines.append(longest[0])
+            line_segments.append((longest[2], longest[3], longest[0]))
+
+    total_rows = max(0, len(filtered_lines) - 1)
+    print(f"Detected {total_rows} rows")
+    return filtered_lines, line_segments
+
+
+def detect_tables(image_path, gap_threshold=50):
     img = cv2.imread(image_path)
     if img is None:
         raise FileNotFoundError(f"Không đọc được ảnh: {image_path}")
     gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
     blur = cv2.GaussianBlur(gray, (3, 3), 0)
-
-    # Edge detection
     edges = cv2.Canny(blur, 50, 150, apertureSize=3)
     # --- Horizontal lines ---
     lines_h = cv2.HoughLinesP(edges, 1, np.pi/180, threshold=120,
                               minLineLength=int(img.shape[1] * 0.6), maxLineGap=20)
-    ys_candidates, line_segments = [], []
+    img_height, img_width = img.shape[:2]
-    if lines_h is not None:
+    ys, line_segments = filter_horizontal_lines(lines_h, img_width, min_h_len_ratio=0.8, tol_y=10)
-        for l in lines_h:
-            x1, y1, x2, y2 = l[0]
-            if abs(y1 - y2) <= 3:  # ngang
-                y_mid = int(round((y1 + y2) / 2))
-                ys_candidates.append(y_mid)
-                line_segments.append((x1, x2, y_mid))
-
-    # gom nhóm y
-    ys, tol_y = [], 10
-    for y in sorted(ys_candidates):
-        if not ys or abs(y - ys[-1]) > tol_y:
-            ys.append(y)
-
     total_rows = max(0, len(ys) - 1)
     # --- Vertical lines ---
     lines_v = cv2.HoughLinesP(edges, 1, np.pi/180, threshold=100,
-                              minLineLength=int(img.shape[0] * 0.5), maxLineGap=20)
+                              minLineLength=int(img.shape[0] * 0.4), maxLineGap=20)
-    xs = []
+    v_lines, xs = [], []
     if lines_v is not None:
         for l in lines_v:
             x1, y1, x2, y2 = l[0]
             if abs(x1 - x2) <= 3:
                 xs.append(int(round((x1 + x2) / 2)))
+                v_lines.append((int(round((x1 + x2) / 2)), min(y1, y2), max(y1, y2)))
     # gom nhóm x
     x_pos, tol_v = [], 10
@@ -50,26 +77,66 @@ def detect_tables(image_path):
             x_pos.append(v)
     total_cols = max(0, len(x_pos) - 1)
-
     tables = []
+
     if total_rows > 0 and total_cols > 0:
         y_min, y_max = ys[0], ys[-1]
         x_min, x_max = x_pos[0], x_pos[-1]
         table_box = (x_min, y_min, x_max, y_max)
-        # build cells
         rows_data = []
         for i in range(total_rows):
             row_cells = []
-            for j in range(total_cols):
+            j = 0
+            while j < total_cols:
                 cell_box = (x_pos[j], ys[i], x_pos[j+1], ys[i+1])
+                row_height = cell_box[3] - cell_box[1]
+
+                # Check vertical line coverage (>=70% chiều cao hàng)
+                has_left = any(
+                    abs(x - cell_box[0]) <= tol_v and
+                    (min(y_end, cell_box[3]) - max(y_start, cell_box[1])) >= 0.7 * row_height
+                    for x, y_start, y_end in v_lines
+                )
+                has_right = any(
+                    abs(x - cell_box[2]) <= tol_v and
+                    (min(y_end, cell_box[3]) - max(y_start, cell_box[1])) >= 0.7 * row_height
+                    for x, y_start, y_end in v_lines
+                )
+
+                if has_left and has_right:
+                    col_start = j
+                    col_end = j
+                    # nếu cột tiếp theo không có line → merge
+                    while col_end + 1 < total_cols:
+                        next_box = (x_pos[col_end+1], ys[i], x_pos[col_end+2], ys[i+1])
+                        has_next_left = any(
+                            abs(x - next_box[0]) <= tol_v and
+                            (min(y_end, next_box[3]) - max(y_start, next_box[1])) >= 0.7 * row_height
+                            for x, y_start, y_end in v_lines
+                        )
+                        if not has_next_left:  # merge tiếp
+                            col_end += 1
+                        else:
+                            break
+
+                    merged_box = (x_pos[col_start], ys[i], x_pos[col_end+1], ys[i+1])
+                    if col_start == col_end:
+                        col_id = col_start
+                    else:
+                        col_id = f"{col_start}-{col_end}"
+
                     row_cells.append({
-                    "cell": cell_box,
+                        "cell": merged_box,
                         "row_idx": i,
-                    "col_idx": j
+                        "col_idx": col_id
                     })
-                # Vẽ ô
+                    cv2.rectangle(img, (merged_box[0], merged_box[1]),
-                cv2.rectangle(img, (cell_box[0], cell_box[1]), (cell_box[2], cell_box[3]), (0, 255, 255), 1)
+                                  (merged_box[2], merged_box[3]), (0, 255, 255), 1)
+                    j = col_end + 1
+                else:
+                    j += 1  # skip ô lỗi (không có line đầy đủ)
+
             rows_data.append(row_cells)
         tables.append({
@@ -78,11 +145,9 @@ def detect_tables(image_path):
             "table_box": table_box,
             "cells": rows_data
         })
-
-        # vẽ viền bảng
         cv2.rectangle(img, (x_min, y_min), (x_max, y_max), (255, 0, 0), 2)
-    debug_path = os.path.splitext(image_path)[0] + "_debug.jpg"
+    debug_path = os.path.splitext(image_path)[0] + "_fix_debug.jpg"
     cv2.imwrite(debug_path, img)
     return tables
--- a/resources/views/ocr/index.blade.php
View file @fec2e1e
+++ b/resources/views/ocr/index.blade.php
View file @fec2e1e