Skip to content

Commit bb7bab3

Browse files
committed
ocr enhance performance
1 parent fd0163e commit bb7bab3

File tree

6 files changed

+277
-27
lines changed

6 files changed

+277
-27
lines changed

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@ Download from [chrome web store](https://chromewebstore.google.com/detail/hmigni
1818
![Alt Text](doc/result1532.gif)
1919
![result](doc/screenshot_3.png)
2020
![result](doc/screenshot_6.png)
21-
![OCR Result](doc/ocr_result.png)
21+
![OCR Result](doc/ocr_result1.gif)
2222

2323
# Features
2424

src/ocr/ocrView.js

Lines changed: 47 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -14,19 +14,22 @@ const windowPostMessageProxy = new WindowPostMessageProxy({
1414
var ocrHistory = {};
1515
var iFrames = {};
1616
var ocrResultHistory = {}; // store ocr result to avoid duplicate request
17+
var translatorHistory = {}; // Store translation history to avoid duplicate translations
1718
var setting;
1819
var ocrFrameName = "ocrFrame";
1920
var opencvFrameName = "opencvFrame";
2021
// var ocrFrameName="ocrFrameDebug"
2122
// var opencvFrameName="opencvFrameDebug";
23+
const textSimilarityThreshold = 0.8; // Threshold for text similarity
24+
var textLengthMultiplier = 7; // Multiplier for text length gap filtering
2225

2326
//detect mouse positioned image to process ocr in ocr.html iframe
2427
//create text box from ocr result
25-
export async function checkImage(x,y, currentSetting, keyDownList) {
28+
export async function checkImage(x, y, currentSetting, keyDownList) {
2629
// if ocr is not on or no key bind, skip
2730
// if mouse target is not image, skip
2831
// if already OCR processed, skip
29-
var img=util.deepElementFromPoint(x, y);
32+
var img = util.deepElementFromPoint(x, y);
3033
if (
3134
!keyDownList[currentSetting["keyDownOCR"]] ||
3235
!checkIsImage(img) ||
@@ -36,6 +39,8 @@ export async function checkImage(x,y, currentSetting, keyDownList) {
3639
}
3740
setting = currentSetting;
3841
ocrHistory[img.src] = img;
42+
translatorHistory[img.src] = [];
43+
ocrResultHistory[img.src] = [];
3944
var lang = setting["ocrLang"];
4045
makeLoadingMouseStyle(img);
4146

@@ -64,6 +69,14 @@ export async function checkImage(x,y, currentSetting, keyDownList) {
6469
"ORANGE",
6570
"bbox_white_useOpencvImg"
6671
),
72+
processOcr(
73+
img.src,
74+
lang,
75+
base64Url,
76+
img,
77+
"PURPLE",
78+
"bbox_black_useOpencvImg"
79+
),
6780
]);
6881

6982
makeNormalMouseStyle(img);
@@ -79,6 +92,7 @@ export function removeAllOcrEnv() {
7992
ocrHistory = {};
8093
hideAll({ duration: 0 });
8194
ocrResultHistory = {};
95+
translatorHistory = {};
8296
}
8397

8498
async function processOcr(mainUrl, lang, base64Url, img, color, mode = "auto") {
@@ -91,15 +105,15 @@ async function processOcr(mainUrl, lang, base64Url, img, color, mode = "auto") {
91105
// OCR process with opencv, then display
92106
if (mode.includes("bbox")) {
93107
// console.time("OCR Process with OpenCV"+mode);
94-
var { bboxList, base64Url, ratio ,opencvImg } = await requestSegmentBox(
108+
var { bboxList, base64Url, ratio, opencvImg } = await requestSegmentBox(
95109
mainUrl,
96110
lang,
97111
base64Url,
98112
mode
99113
);
100114
// console.timeEnd("OCR Process with OpenCV"+mode);
101115
}
102-
116+
103117
await Promise.all(
104118
bboxList.map(async (bbox) => {
105119
var res = await requestOcr(mainUrl, lang, [bbox], base64Url, mode);
@@ -141,19 +155,19 @@ async function createIframe(name, htmlPath) {
141155
}
142156

143157
function loadScript(name, htmlPath) {
144-
var debugCSS={
158+
var debugCSS = {
145159
width: "700",
146160
height: "700",
147161
pointerEvents: "auto",
148162
opacity: 1.0,
149-
}
163+
};
150164
var iFrameCSS = {
151165
width: "1",
152166
height: "1",
153167
pointerEvents: "none",
154168
opacity: 0.0,
155169
};
156-
170+
157171
return new Promise(function (resolve, reject) {
158172
var iFrame = $("<iframe />", {
159173
name: name,
@@ -214,14 +228,30 @@ async function showOcrData(img, ocrData, ratio, color) {
214228

215229
async function showTooltipBoxes(img, textBoxList) {
216230
var filteredTextBoxList = filterDuplicateOcr(img, textBoxList);
231+
217232
for (var textBox of filteredTextBoxList) {
218233
var { targetText, sourceLang, targetLang } = await handleTranslate(
219234
textBox["text"]
220235
);
221-
// filter large translate text len gap
222-
if(targetText.length >textBox["text"].length*7){
236+
237+
const isAlreadyTranslated = translatorHistory[img.src].some(
238+
(prevTargetText) => {
239+
return (
240+
calculateTextSimilarity(prevTargetText, targetText) >
241+
textSimilarityThreshold
242+
);
243+
}
244+
);
245+
246+
// Filter large translate text length gap
247+
if (
248+
targetText.length > textBox["text"].length * textLengthMultiplier ||
249+
isAlreadyTranslated
250+
) {
223251
continue;
224252
}
253+
254+
translatorHistory[img.src].push(targetText);
225255
addTooltipBox(img, textBox, targetText, targetLang);
226256
}
227257
}
@@ -254,11 +284,7 @@ function calculateTextSimilarity(text1, text2) {
254284

255285
function filterDuplicateOcr(img, textBoxList) {
256286
// Ensure ocrResultHistory exists for the image
257-
if (!ocrResultHistory[img.src]) {
258-
ocrResultHistory[img.src] = [];
259-
}
260287
const bboxThreshold = 15; // Threshold for bounding box similarity (bbox is a common term in OCR)
261-
const textSimilarityThreshold = 0.8; // Threshold for text similarity (e.g., Levenshtein distance ratio)
262288

263289
// Filter out text boxes that are similar to previous history
264290
const filteredTextBoxList = textBoxList.filter((textBox) => {
@@ -293,10 +319,12 @@ function adjustTextBoxBbox(textBox, ratio) {
293319
textBox["bbox"]["y1"] = Math.ceil(textBox["bbox"]["y1"] / ratio);
294320
}
295321

296-
297322
function addTooltipBox(img, textBox, text, targetLang) {
298323
// Create a tooltip element using Tippy.js
299-
var tooltipWidth = textBox["bbox"]["x1"] - textBox["bbox"]["x0"];
324+
var tooltipWidth = Math.max(
325+
200,
326+
textBox["bbox"]["x1"] - textBox["bbox"]["x0"]
327+
);
300328
const tooltipContent = $("<span/>", {
301329
text: text,
302330
css: {
@@ -377,7 +405,10 @@ function addTooltipBox(img, textBox, text, targetLang) {
377405
});
378406

379407
$(window).on("resize", () => {
380-
const { left, top, width, height } = calculateImgSegBoxSize(img, textBox["bbox"]);
408+
const { left, top, width, height } = calculateImgSegBoxSize(
409+
img,
410+
textBox["bbox"]
411+
);
381412
tooltipTarget.css({
382413
left: `${left}px`,
383414
top: `${top + height * 0.7}px`,

src/ocr/opencvHandler.js

Lines changed: 121 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -117,6 +117,113 @@ function detectText(canvasIn, mode) {
117117
var ksize = new cv.Size(12, 12);
118118
var element = cv.getStructuringElement(cv.MORPH_RECT, ksize);
119119
cv.cvtColor(src, dst, cv.COLOR_RGBA2GRAY, 0);
120+
} else if (mode.includes("black")) {
121+
var ksize = new cv.Size(15, 15);
122+
var element = cv.getStructuringElement(cv.MORPH_RECT, ksize);
123+
124+
cv.bitwise_not(src, src);
125+
126+
// Convert image to grayscale and ensure single-channel
127+
cv.cvtColor(src, dst, cv.COLOR_RGBA2GRAY, 0);
128+
// Threshold to get white areas (255, 255, 255)
129+
130+
//get white area as mask
131+
cv.threshold(dst, dst, 210, 255, cv.THRESH_BINARY);
132+
// showImage(dst, mode);
133+
134+
// Create floodfill masks for each edge
135+
let combinedFloodMask = new cv.Mat(
136+
dst.rows,
137+
dst.cols,
138+
cv.CV_8U,
139+
new cv.Scalar(0)
140+
);
141+
var combinedFloodVisited = new Set();
142+
combinedFloodMask = customFloodFillWithoutCv(
143+
dst,
144+
{ x: 0, y: 0 },
145+
combinedFloodMask,
146+
combinedFloodVisited
147+
);
148+
combinedFloodMask = customFloodFillWithoutCv(
149+
dst,
150+
{ x: dst.cols - 1, y: 0 },
151+
combinedFloodMask,
152+
combinedFloodVisited
153+
);
154+
combinedFloodMask = customFloodFillWithoutCv(
155+
dst,
156+
{ x: 0, y: dst.rows - 1 },
157+
combinedFloodMask,
158+
combinedFloodVisited
159+
);
160+
combinedFloodMask = customFloodFillWithoutCv(
161+
dst,
162+
{ x: dst.cols - 1, y: dst.rows - 1 },
163+
combinedFloodMask,
164+
combinedFloodVisited
165+
);
166+
// showImage(combinedFloodMask, mode);
167+
// Remove mask area that exists in combinedFloodMask
168+
cv.bitwise_not(dst, dst);
169+
cv.bitwise_or(dst, combinedFloodMask, dst);
170+
cv.bitwise_not(dst, dst);
171+
172+
// cv.bitwise_not(dst, dst); // Invert the image to get black areas
173+
// cv.bitwise_not(combinedFloodMask, combinedFloodMask); // Invert the image to get black areas
174+
// cv.bitwise_and(dst, dst, dst, combinedFloodMask); // Apply the mask to the original image grep white area as mask
175+
// cv.bitwise_not(dst, dst); // Invert the image to get black areas again
176+
177+
// showImage(dst, mode);
178+
179+
// // Apply the mask to the original image grep white area as mask
180+
// let mask = new cv.Mat();
181+
// cv.bitwise_and(src, src, mask, dst);
182+
// showImage(mask, mode);
183+
184+
// make invert white area using floodfill
185+
// dst = mask.clone(); // Update dst to the masked image
186+
187+
cv.copyMakeBorder(
188+
dst,
189+
dst,
190+
1,
191+
1,
192+
1,
193+
1,
194+
cv.BORDER_CONSTANT,
195+
new cv.Scalar(0)
196+
);
197+
// Flood fill the mask to get the white area
198+
let floodFillMask = customFloodFillWithoutCv(dst, { x: 0, y: 0 });
199+
cv.bitwise_not(floodFillMask, floodFillMask);
200+
floodFillMask = floodFillMask.roi(
201+
new cv.Rect(1, 1, floodFillMask.cols - 2, floodFillMask.rows - 2)
202+
);
203+
let slicedResultMask = new cv.Mat();
204+
cv.bitwise_and(src, src, slicedResultMask, floodFillMask);
205+
206+
// showImage(slicedResultMask, mode);
207+
// // make white background and combine with slicedResultMask
208+
cv.bitwise_not(floodFillMask, floodFillMask);
209+
cv.cvtColor(floodFillMask, floodFillMask, cv.COLOR_GRAY2RGBA, 0);
210+
cv.bitwise_or(slicedResultMask, floodFillMask, floodFillMask);
211+
// showImage(floodFillMask, mode);
212+
213+
// Enhance color saturation
214+
let enhancedImage = new cv.Mat();
215+
cv.cvtColor(floodFillMask, enhancedImage, cv.COLOR_RGBA2RGB, 0);
216+
cv.convertScaleAbs(enhancedImage, enhancedImage, 2.1, 0); // Increase intensity
217+
cv.bitwise_not(enhancedImage, enhancedImage); // Invert colors
218+
cv.convertScaleAbs(enhancedImage, enhancedImage, 1.5, 0); // Adjust intensity
219+
cv.bitwise_not(enhancedImage, enhancedImage); // Invert colors
220+
preprocessedSourceImage = enhancedImage;
221+
222+
// showImage(preprocessedSourceImage, mode);
223+
// Update src and dst with the sliced result
224+
src = floodFillMask;
225+
dst = preprocessedSourceImage.clone();
226+
cv.cvtColor(dst, dst, cv.COLOR_RGBA2GRAY, 0);
120227
} else if (mode.includes("white")) {
121228
var ksize = new cv.Size(15, 15);
122229
var element = cv.getStructuringElement(cv.MORPH_RECT, ksize);
@@ -129,7 +236,7 @@ function detectText(canvasIn, mode) {
129236
//get white area as mask
130237
cv.threshold(dst, dst, 230, 255, cv.THRESH_BINARY);
131238

132-
// showImage(dst, mode);
239+
// showImage(dst, mode);
133240
// Combine all masks into one
134241
let combinedFloodMask = new cv.Mat(
135242
dst.rows,
@@ -172,13 +279,13 @@ function detectText(canvasIn, mode) {
172279
cv.bitwise_not(dst, dst);
173280

174281
// Apply the mask to the original image to get the white area as mask
175-
let mask = new cv.Mat();
176-
cv.bitwise_and(src, src, mask, dst);
282+
// let mask = new cv.Mat();
283+
// cv.bitwise_and(src, src, mask, dst);
177284

178285
// showImage(mask, mode);
179286

180287
// make invert white area using floodfill
181-
dst = mask.clone(); // Update dst to the masked image
288+
// dst = mask.clone(); // Update dst to the masked image
182289
cv.copyMakeBorder(
183290
dst,
184291
dst,
@@ -211,7 +318,6 @@ function detectText(canvasIn, mode) {
211318
cv.bitwise_or(slicedResultMask, slicedBorderMask, slicedBorderMask);
212319
// showImage(slicedBorderMask, mode);
213320

214-
215321
// Enhance color saturation
216322
let enhancedImage = new cv.Mat();
217323
cv.cvtColor(slicedBorderMask, enhancedImage, cv.COLOR_RGBA2RGB, 0);
@@ -220,6 +326,7 @@ function detectText(canvasIn, mode) {
220326
cv.convertScaleAbs(enhancedImage, enhancedImage, 1.5, 0); // Adjust intensity
221327
cv.bitwise_not(enhancedImage, enhancedImage); // Invert colors
222328
preprocessedSourceImage = enhancedImage;
329+
// showImage(preprocessedSourceImage, mode);
223330

224331
// Update src and dst with the sliced result
225332
src = slicedBorderMask;
@@ -309,11 +416,11 @@ function detectText(canvasIn, mode) {
309416
rectCoverRatio < 0.15 ||
310417
cnt.rows < 100 ||
311418
area < 150 ||
312-
!isRightAngle ||
313-
left == 0 ||
314-
top == 0 ||
315-
left + width == w ||
316-
top + height == h
419+
!isRightAngle
420+
// left == 0 ||
421+
// top == 0
422+
// left + width == w ||
423+
// top + height == h
317424
) {
318425
continue;
319426
}
@@ -434,6 +541,8 @@ function preprocessImage(canvasIn, isResize) {
434541
}
435542

436543
function customFloodFillWithoutCv(image, startPoint, mask, visited) {
544+
// console.time("customFloodFillWithoutCv");
545+
437546
let rows = image.rows;
438547
let cols = image.cols;
439548
var mask = mask || new cv.Mat(rows, cols, cv.CV_8U, new cv.Scalar(0));
@@ -463,6 +572,8 @@ function customFloodFillWithoutCv(image, startPoint, mask, visited) {
463572
{ x, y: y - 1 }
464573
);
465574
}
575+
576+
// console.timeEnd("customFloodFillWithoutCv");
466577
return mask;
467578
}
468579

0 commit comments

Comments
 (0)