MVP on OCT and webcam

2024-08-21 16:35:56 -07:00 · 2024-08-21 16:35:56 -07:00 · 6b17ec50d4
commit 6b17ec50d4
parent 5fc716c954
12 changed files with 145 additions and 0 deletions
--- a/frame_1.png
+++ b/frame_1.png
--- a/frame_10.png
+++ b/frame_10.png
--- a/frame_2.png
+++ b/frame_2.png
--- a/frame_3.png
+++ b/frame_3.png
--- a/frame_4.png
+++ b/frame_4.png
--- a/frame_5.png
+++ b/frame_5.png
--- a/frame_6.png
+++ b/frame_6.png
--- a/frame_7.png
+++ b/frame_7.png
--- a/frame_8.png
+++ b/frame_8.png
--- a/frame_9.png
+++ b/frame_9.png
--- a/main.py
+++ b/main.py
@ -0,0 +1,70 @@
+import cv2
+import easyocr
+import numpy as np
+from PIL import Image
+from collections import Counter
+
+# Initialize the EasyOCR reader
+reader = easyocr.Reader(['en'])
+
+def preprocess_image(image):
+    # Convert to PIL image for EasyOCR processing
+    return Image.fromarray(cv2.cvtColor(image, cv2.COLOR_BGR2RGB))
+
+def recognize_text(image):
+    processed_image = preprocess_image(image)
+    results = reader.readtext(np.array(processed_image), allowlist='0123456789')
+    # Concatenate all recognized text results
+    recognized_text = ''.join(result[1] for result in results)
+    return recognized_text
+
+def format_number(text, length=6):
+    # Remove non-numeric characters and pad with zeros if necessary
+    formatted = ''.join(filter(str.isdigit, text))
+    return formatted.zfill(length)[-length:]
+
+def most_common_number(numbers):
+    # Find the most common number from the list of numbers
+    counter = Counter(numbers)
+    most_common = counter.most_common(1)
+    return most_common[0][0] if most_common else ''
+
+def main():
+    cap = cv2.VideoCapture(2)
+
+    if not cap.isOpened():
+        print("Error: Could not open webcam.")
+        return
+
+    print("Press 'q' to quit.")
+    frame_count = 0
+    text_history = []
+
+    while True:
+        ret, frame = cap.read()
+        if not ret:
+            print("Error: Failed to capture image.")
+            break
+
+        # Recognize text from the current frame
+        recognized_text = recognize_text(frame)
+        formatted_number = format_number(recognized_text)
+
+        # Update the history with the latest recognized number
+        text_history.append(formatted_number)
+
+        # Keep only the last 10 frames
+        if len(text_history) > 20:
+            text_history.pop(0)
+
+        # Determine the most common number from the history
+        most_common = most_common_number(text_history)
+        print(f"Most common number from last 10 frames: {most_common}")
+
+        # if cv2.waitKey(1) & 0xFF == ord('q'):
+        #     break
+
+    cap.release()
+
+if __name__ == "__main__":
+    main()
--- a/requirements.txt
+++ b/requirements.txt
@ -0,0 +1,75 @@
+absl-py==2.1.0
+astunparse==1.6.3
+certifi==2024.7.4
+charset-normalizer==3.3.2
+easyocr==1.7.1
+filelock==3.15.4
+flatbuffers==24.3.25
+fsspec==2024.6.1
+gast==0.6.0
+google-pasta==0.2.0
+grpcio==1.65.5
+h5py==3.11.0
+idna==3.7
+imageio==2.35.1
+Jinja2==3.1.4
+joblib==1.4.2
+keras==3.5.0
+lazy_loader==0.4
+libclang==18.1.1
+Markdown==3.7
+markdown-it-py==3.0.0
+MarkupSafe==2.1.5
+mdurl==0.1.2
+ml-dtypes==0.4.0
+mpmath==1.3.0
+namex==0.0.8
+networkx==3.3
+ninja==1.11.1.1
+numpy==1.26.4
+nvidia-cublas-cu12==12.1.3.1
+nvidia-cuda-cupti-cu12==12.1.105
+nvidia-cuda-nvrtc-cu12==12.1.105
+nvidia-cuda-runtime-cu12==12.1.105
+nvidia-cudnn-cu12==9.1.0.70
+nvidia-cufft-cu12==11.0.2.54
+nvidia-curand-cu12==10.3.2.106
+nvidia-cusolver-cu12==11.4.5.107
+nvidia-cusparse-cu12==12.1.0.106
+nvidia-nccl-cu12==2.20.5
+nvidia-nvjitlink-cu12==12.6.20
+nvidia-nvtx-cu12==12.1.105
+opencv-python==4.10.0.84
+opencv-python-headless==4.10.0.84
+opt-einsum==3.3.0
+optree==0.12.1
+packaging==24.1
+pillow==10.4.0
+protobuf==4.25.4
+pyclipper==1.3.0.post5
+Pygments==2.18.0
+pytesseract==0.3.13
+python-bidi==0.6.0
+PyYAML==6.0.2
+requests==2.32.3
+rich==13.7.1
+scikit-image==0.24.0
+scikit-learn==1.5.1
+scipy==1.14.1
+shapely==2.0.6
+six==1.16.0
+sympy==1.13.2
+tensorboard==2.17.1
+tensorboard-data-server==0.7.2
+tensorflow==2.17.0
+tensorflow-io-gcs-filesystem==0.37.1
+termcolor==2.4.0
+threadpoolctl==3.5.0
+tifffile==2024.8.10
+torch==2.4.0
+torchvision==0.19.0
+triton==3.0.0
+typing_extensions==4.12.2
+urllib3==2.2.2
+Werkzeug==3.0.4
+wrapt==1.16.0