PyPI - ytcollector - Version diff - 1.1.1.tar.gz → 1.1.2.tar.gz - Mend

ytcollector 1.1.1.tar.gz → 1.1.2.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (17) hide show

{ytcollector-1.1.1 → ytcollector-1.1.2}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: ytcollector
-Version: 1.1.1
+Version: 1.1.2
 Summary: YouTube 콘텐츠 수집기 - 얼굴, 번호판, 타투, 텍스트 감지
 Author: YTCollector Team
 License: MIT
@@ -24,6 +24,7 @@ Provides-Extra: analysis
 Requires-Dist: opencv-python>=4.5.0; extra == "analysis"
 Requires-Dist: easyocr>=1.6.0; extra == "analysis"
 Requires-Dist: numpy>=1.20.0; extra == "analysis"
+Requires-Dist: ultralytics>=8.0.0; extra == "analysis"
 Provides-Extra: dev
 Requires-Dist: pytest>=7.0.0; extra == "dev"
 Requires-Dist: black>=23.0.0; extra == "dev"
@@ -46,7 +47,9 @@ pip install yt-dlp
 ### 분석 기능용 패키지 (권장)
 ```bash
-pip install opencv-python easyocr numpy
+pip install opencv-python easyocr numpy ultralytics
+# YOLO-World 기능을 사용하려면 아래 CLIP 라이브러리 수동 설치가 필요합니다.
+pip install "git+https://github.com/ultralytics/CLIP.git"
 ```
 ## 사용법
@@ -184,9 +187,9 @@ https://www.youtube.com/watch?v=aqz-KE-bpKQ, 00:10, sample_task
 | 감지 항목 | 사용 기술 | 설명 |
 |-----------|-----------|------|
 | 얼굴 | OpenCV Haar Cascade | 정면 얼굴 감지 |
-| 텍스트 | EasyOCR | 한국어/영어 문자 인식 |
-| 번호판 | EasyOCR + 정규식 | 번호판 패턴 매칭 |
-| 타투 | OpenCV HSV 분석 | 피부 영역 내 잉크 패턴 |
+| 텍스트 | EasyOCR | 한국어/영어 문자 인식 (분석 품질 및 프레임 수 개선) |
+| 번호판 | YOLO-World + OCR | YOLO-World 기반 시각적 감지 + OCR 매칭 |
+| 타투 | OpenCV HSV 분석 | 피부 영역 내 잉크 패턴 감지 |
 ## 주의사항

{ytcollector-1.1.1 → ytcollector-1.1.2}/README.md RENAMED Viewed

@@ -13,7 +13,9 @@ pip install yt-dlp
 ### 분석 기능용 패키지 (권장)
 ```bash
-pip install opencv-python easyocr numpy
+pip install opencv-python easyocr numpy ultralytics
+# YOLO-World 기능을 사용하려면 아래 CLIP 라이브러리 수동 설치가 필요합니다.
+pip install "git+https://github.com/ultralytics/CLIP.git"
 ```
 ## 사용법
@@ -151,9 +153,9 @@ https://www.youtube.com/watch?v=aqz-KE-bpKQ, 00:10, sample_task
 | 감지 항목 | 사용 기술 | 설명 |
 |-----------|-----------|------|
 | 얼굴 | OpenCV Haar Cascade | 정면 얼굴 감지 |
-| 텍스트 | EasyOCR | 한국어/영어 문자 인식 |
-| 번호판 | EasyOCR + 정규식 | 번호판 패턴 매칭 |
-| 타투 | OpenCV HSV 분석 | 피부 영역 내 잉크 패턴 |
+| 텍스트 | EasyOCR | 한국어/영어 문자 인식 (분석 품질 및 프레임 수 개선) |
+| 번호판 | YOLO-World + OCR | YOLO-World 기반 시각적 감지 + OCR 매칭 |
+| 타투 | OpenCV HSV 분석 | 피부 영역 내 잉크 패턴 감지 |
 ## 주의사항

{ytcollector-1.1.1 → ytcollector-1.1.2}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 [project]
 name = "ytcollector"
-version = "1.1.1"
+version = "1.1.2"
 description = "YouTube 콘텐츠 수집기 - 얼굴, 번호판, 타투, 텍스트 감지"
 readme = "README.md"
 requires-python = ">=3.8"
@@ -34,6 +34,7 @@ analysis = [
     "opencv-python>=4.5.0",
     "easyocr>=1.6.0",
     "numpy>=1.20.0",
+    "ultralytics>=8.0.0",
 ]
 dev = [
     "pytest>=7.0.0",

{ytcollector-1.1.1 → ytcollector-1.1.2}/ytcollector/analyzer.py RENAMED Viewed

@@ -21,6 +21,15 @@ try:
 except ImportError:
     NUMPY_AVAILABLE = False
+try:
+    from ultralytics import YOLOWorld
+    YOLO_AVAILABLE = True
+except ImportError:
+    YOLOWorld = None
+    YOLO_AVAILABLE = False
+from .config import LICENSE_PLATE_PATTERNS, YOLO_MODEL_NAME, YOLO_CONFIDENCE, YOLO_PROMPTS
 class VideoAnalyzer:
     """영상 분석 클래스 - 얼굴, 텍스트, 번호판, 타투 감지"""
@@ -30,6 +39,7 @@ class VideoAnalyzer:
     def __init__(self):
         self.ocr_reader = None
         self.face_cascade = None
+        self.yolo_model = None
         if CV2_AVAILABLE:
             cascade_path = cv2.data.haarcascades + 'haarcascade_frontalface_default.xml'
@@ -43,6 +53,16 @@ class VideoAnalyzer:
                     print("  OCR 엔진 초기화 중...")
                     self.ocr_reader = easyocr.Reader(['ko', 'en'], gpu=False, verbose=False)
+    def _init_yolo(self):
+        """YOLO-World 모델 초기화 (필요할 때만, 스레드 안전)"""
+        if YOLO_AVAILABLE and self.yolo_model is None:
+            with self._ocr_lock:
+                if self.yolo_model is None:
+                    print(f"  YOLO-World 모델({YOLO_MODEL_NAME}) 로딩 중...")
+                    self.yolo_model = YOLOWorld(YOLO_MODEL_NAME)
+                    # 감지할 클래스(프롬프트) 설정
+                    self.yolo_model.set_classes(YOLO_PROMPTS)
     def extract_frames(self, video_path, num_frames=10):
         """영상에서 균등 간격으로 프레임 추출"""
         if not CV2_AVAILABLE:
@@ -87,23 +107,68 @@ class VideoAnalyzer:
         self._init_ocr()
         try:
             h, w = frame.shape[:2]
-            if w > 640:
-                scale = 640 / w
-                frame = cv2.resize(frame, (640, int(h * scale)))
+            # 가독성 개선을 위해 1080p 수준으로 리사이즈 (너무 작으면 인식률 저하)
+            if w > 1280:
+                scale = 1280 / w
+                frame = cv2.resize(frame, (1280, int(h * scale)), interpolation=cv2.INTER_LANCZOS4)
+            elif w < 640:
+                # 너무 작은 경우 확대
+                scale = 960 / w
+                frame = cv2.resize(frame, (960, int(h * scale)), interpolation=cv2.INTER_CUBIC)
+            # 전처리: 그레이스케일 및 대비 강화 (옵션)
+            gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
+            clahe = cv2.createCLAHE(clipLimit=2.0, tileGridSize=(8,8))
+            processed = clahe.apply(gray)
             with self._ocr_lock:
-                results = self.ocr_reader.readtext(frame)
-            return [r[1] for r in results if r[2] > 0.3]
-        except:
+                # 원본(컬러)과 전처리(그레이) 중 선택 가능하나 보통 EasyOCR은 컬러에서 잘 작동함
+                # 대비 강화된 그레이스케일을 사용해봄
+                results = self.ocr_reader.readtext(processed)
+            # 신뢰도 임계값 0.25로 약간 하향 조정 (기존 0.3)
+            return [r[1] for r in results if r[2] > 0.25]
+        except Exception as e:
+            print(f"  ⚠ OCR 에러: {e}")
             return []
-    def detect_license_plate(self, texts):
-        """텍스트에서 번호판 패턴 감지"""
+    def detect_license_plate(self, texts, frame=None):
+        """텍스트에서 번호판 패턴 감지 및 YOLO-World 보조 감지"""
+        # 1. YOLO-World로 번호판 영역 확인
+        if YOLO_AVAILABLE and frame is not None:
+            try:
+                self._init_yolo()
+                if self.yolo_model:
+                    results = self.yolo_model(frame, verbose=False, conf=YOLO_CONFIDENCE)
+                    for r in results:
+                        # YOLO-World 클래스 인덱스는 YOLO_PROMPTS 순서와 같음
+                        # 0: license plate, 1: tattoo, 2: face (config 기준)
+                        if any(box.cls == 0 for box in r.boxes):
+                            # 번호판이 감지됨 -> 텍스트가 조금이라도 있으면 통과
+                            if texts: return True
+                            # 텍스트가 없어도 신뢰도가 높으면 감지된 것으로 간주 (옵션)
+                            if any(box.conf > 0.5 for box in r.boxes if box.cls == 0):
+                                return True
+            except:
+                pass
+        if not texts:
+            return False
+        # 2. 개별 텍스트 박스 체크
         for text in texts:
-            text_clean = text.replace(' ', '').upper()
+            text_clean = re.sub(r'[^0-9가-힣]', '', text)
             for pattern in LICENSE_PLATE_PATTERNS:
                 if re.search(pattern, text_clean):
                     return True
+        # 3. 프레임 내 모든 텍스트 결합 후 체크 (번호판이 쪼개진 경우 대응)
+        combined_text = "".join([re.sub(r'[^0-9가-힣]', '', t) for t in texts])
+        for pattern in LICENSE_PLATE_PATTERNS:
+            if re.search(pattern, combined_text):
+                return True
         return False
     def detect_tattoo(self, frame):
@@ -175,7 +240,12 @@ class VideoAnalyzer:
         total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
         cap.release()
-        num_analysis_frames = 10
+        # 분석 프레임 수 증가 (10 -> 20)
+        num_analysis_frames = 20
+        # 영상이 아주 긴 경우(10분 이상) 더 많은 프레임 추출
+        if total_frames / fps > 600:
+            num_analysis_frames = 30
         frame_indices = [int(i * total_frames / (num_analysis_frames + 1)) for i in range(1, num_analysis_frames + 1)]
         all_texts = []
@@ -198,12 +268,16 @@ class VideoAnalyzer:
                 total_faces += len(faces)
                 detected_now = True
-            # 텍스트
+            # 텍스트 및 번호판
             texts = self.detect_text(frame)
             if texts:
                 results['text'] = True
                 all_texts.extend(texts)
                 detected_now = True
+                # 번호판 감지 (프레임별로 결합 텍스트 및 YOLO 확인)
+                if self.detect_license_plate(texts, frame=frame):
+                    results['license_plate'] = True
             # 타투
             if self.detect_tattoo(frame):
@@ -218,9 +292,7 @@ class VideoAnalyzer:
         cap.release()
-        # 번호판 (텍스트에서)
         if all_texts:
-            results['license_plate'] = self.detect_license_plate(all_texts)
             results['detected_texts'] = list(set(all_texts))[:10]
         results['face_count'] = total_faces

{ytcollector-1.1.1 → ytcollector-1.1.2}/ytcollector/cli.py RENAMED Viewed

@@ -74,7 +74,7 @@ def create_parser():
     parser.add_argument(
         '-v', '--version',
         action='version',
-        version='%(prog)s 1.1.1'
+        version='%(prog)s 1.1.2'
     )
     parser.add_argument(
         '--check-deps',

{ytcollector-1.1.1 → ytcollector-1.1.2}/ytcollector/config.py RENAMED Viewed

@@ -37,14 +37,10 @@ CATEGORY_QUERIES = {
     ],
     'text': [
         "SBS 런닝맨 레전드",
-        "SBS 미운우리새끼 명장면",
-        "SBS 동상이몽 클립",
-        "SBS 집사부일체 모음",
-        "SBS 골목식당 레전드",
-        "SBS 맛남의광장 클립",
-        "SBS 불타는청춘 명장면",
-        "SBS 정글의법칙 레전드",
-        "SBS 예능",
+        "SBS 예능 쇼츠",
+        "재미있는 자막 영상 쇼츠",
+        "SBS 파워FM 보이는 라디오",
+        "SBS 연예대상 소감",
     ],
 }
@@ -61,6 +57,9 @@ BLACKLIST_KEYWORDS = {
         "두피 문신", "두피문신",
         "눈썹 문신", "눈썹문신",
         "입술 문신", "입술문신",
+        "립타투", "립 타투",
+        "헤어타투", "헤어 타투",
+        "구레나룻문신", "구레나룻 문신",
         "틴트 입술",
         "반영구", "SMP"
     ],
@@ -69,12 +68,21 @@ BLACKLIST_KEYWORDS = {
     'text': []
 }
-# 번호판 정규식 패턴
+# YOLO 설정
+YOLO_MODEL_NAME = 'yolov8s-world.pt' # YOLO-World 모델 (Open Vocabulary)
+YOLO_CONFIDENCE = 0.3                # YOLO-World는 임계값을 약간 낮게 설정 가능
+YOLO_PROMPTS = ["license plate"]
+# 번호판 정규식 패턴 (한국 자동차 번호판 중심)
 LICENSE_PLATE_PATTERNS = [
-    r'\d{2,3}[가-힣]\d{4}',
-    r'[가-힣]{2}\d{2}[가-힣]\d{4}',
-    r'[A-Z]{2,3}[-\s]?\d{2,4}[-\s]?[A-Z]{0,3}',
-    r'\d{2,4}[-\s]?[A-Z]{2,3}[-\s]?\d{2,4}',
+    # 1. 신형/구형 번호판 (12가 3456, 123가 4567)
+    r'\d{2,3}[가-힣]{1}\d{4}',
+    # 2. 지역 포함 번호판 (서울 12 가 3456)
+    r'[가-힣]{2}\d{2}[가-힣]{1}\d{4}',
+    # 3. 전기차/외교/임시 등 특수 패턴 대응
+    r'[가-힣]{2,3}\d{4}', # (예: 외교 1234, 임시 1234)
+    # 4. 결합된 텍스트에서 숫자-글자-숫자 구성 포착
+    r'\d+[가-힣]+\d+',
 ]
 # 스킵할 에러 메시지

{ytcollector-1.1.1 → ytcollector-1.1.2}/ytcollector.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: ytcollector
-Version: 1.1.1
+Version: 1.1.2
 Summary: YouTube 콘텐츠 수집기 - 얼굴, 번호판, 타투, 텍스트 감지
 Author: YTCollector Team
 License: MIT
@@ -24,6 +24,7 @@ Provides-Extra: analysis
 Requires-Dist: opencv-python>=4.5.0; extra == "analysis"
 Requires-Dist: easyocr>=1.6.0; extra == "analysis"
 Requires-Dist: numpy>=1.20.0; extra == "analysis"
+Requires-Dist: ultralytics>=8.0.0; extra == "analysis"
 Provides-Extra: dev
 Requires-Dist: pytest>=7.0.0; extra == "dev"
 Requires-Dist: black>=23.0.0; extra == "dev"
@@ -46,7 +47,9 @@ pip install yt-dlp
 ### 분석 기능용 패키지 (권장)
 ```bash
-pip install opencv-python easyocr numpy
+pip install opencv-python easyocr numpy ultralytics
+# YOLO-World 기능을 사용하려면 아래 CLIP 라이브러리 수동 설치가 필요합니다.
+pip install "git+https://github.com/ultralytics/CLIP.git"
 ```
 ## 사용법
@@ -184,9 +187,9 @@ https://www.youtube.com/watch?v=aqz-KE-bpKQ, 00:10, sample_task
 | 감지 항목 | 사용 기술 | 설명 |
 |-----------|-----------|------|
 | 얼굴 | OpenCV Haar Cascade | 정면 얼굴 감지 |
-| 텍스트 | EasyOCR | 한국어/영어 문자 인식 |
-| 번호판 | EasyOCR + 정규식 | 번호판 패턴 매칭 |
-| 타투 | OpenCV HSV 분석 | 피부 영역 내 잉크 패턴 |
+| 텍스트 | EasyOCR | 한국어/영어 문자 인식 (분석 품질 및 프레임 수 개선) |
+| 번호판 | YOLO-World + OCR | YOLO-World 기반 시각적 감지 + OCR 매칭 |
+| 타투 | OpenCV HSV 분석 | 피부 영역 내 잉크 패턴 감지 |
 ## 주의사항