PyPI - kmisc - Versions diffs - 2.1.121__py3-none-any.whl → 2.1.123__py3-none-any.whl - Mend

kmisc 2.1.121py3-none-any.whl → 2.1.123py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

kmisc/__init__.py CHANGED Viewed

@@ -23,12 +23,13 @@ import fnmatch
 import smtplib
 import zipfile
 import tarfile
+import warnings
 import email.utils
 from sys import modules
 from pprint import pprint
 import fcntl,socket,struct
 from email import encoders
-from threading import Thread
+from threading import Thread, Lock
 from datetime import datetime
 from http.cookies import Morsel # This module for requests when you use build by pyinstaller command
 import xml.etree.ElementTree as ET
@@ -39,6 +40,10 @@ Process=multiprocessing.Process
 Queue=multiprocessing.Queue
 #from multiprocessing import Process, Queue
 from email.mime.multipart import MIMEMultipart
+warning_message='ignore'
+warnings.filterwarnings(warning_message)
 try:
     from kmport import *
     import kmport
@@ -3448,7 +3453,7 @@ def Upper(src,default='org'):
     if default in ['org',{'org'}]: return src
     return default
-def web_capture(url,output_file,image_size='1920,1080',wait_time=3,ignore_certificate_error=False,username=None,password=None,auth_fields={'auth':{'type':'name','name':('username','password')},'submit':{'type':'submit','name':None}},next_do={}):
+def web_capture(url,output_file,image_size='1920,1080',wait_time=3,ignore_certificate_error=False,username=None,password=None,auth_fields={'auth':{'type':'name','name':('username','password')},'submit':{'type':'submit','name':None}},next_do={},gpu=False,live_capture=0,capture_method='file',capture_type='png',video_file=None,find_string=None,found_space='\n',log=None,ocr_enhance=False,daemon=False,backup=False):
     #auth_fields.submit.type : name    : login button with name
     #                        : id      : login button with id
     #                        : submit  : submit button without name or id
@@ -3458,20 +3463,36 @@ def web_capture(url,output_file,image_size='1920,1080',wait_time=3,ignore_certif
     #auth_fields.auth.name   : (usernane,password)    : username/password field string for name or id
     #next_do                 : put data and click submit
+    _url=url.split('/')
+    url=WEB().url_join(*_url[1:],method=_url[0])
     if isinstance(image_size,str):
         if 'x' in image_size:
             image_size=image_size.split('x')
         elif ',' in image_size:
             image_size=image_size.split(',')
+        elif '*' in image_size:
+            image_size=image_size.split('*')
+        elif ':' in image_size:
+            image_size=image_size.split(':')
     if isinstance(image_size,(list,tuple)) and len(image_size) == 2:
         image_size=','.join([str(i) for i in image_size])
     else:
-        #Set it to default image size
-        image_size='1920,1080'
+        if not IsIn(image_size,[None,'full','fullscreen','full_screen','auto']):
+            #Set it to default image size
+            image_size='1920,1080'
     if Import('import selenium'):
         return False,'Can not install selenium package'
     else:
+        if backup:
+            Import('filecmp')
+            Import('shutil')
+        if capture_type in ['mov','mp4']:
+            Import('cv2',install_name='opencv-python')
+        ocr=None
+        if capture_method != 'file':
+            ocr=OCR(enhance=ocr_enhance)
         # Configure Chrome options for headless mode
         from selenium.webdriver.chrome.options import Options
         from selenium.webdriver.common.by import By
@@ -3481,12 +3502,18 @@ def web_capture(url,output_file,image_size='1920,1080',wait_time=3,ignore_certif
         chrome_options.add_argument('--headless')  # Run in headless mode
         chrome_options.add_argument('--no-sandbox')
         chrome_options.add_argument('--disable-dev-shm-usage')
-        chrome_options.add_argument(f"--window-size={image_size}")  # Set window size
+        if image_size.lower() not in ['full','fullscreen','full_screen','auto']:
+            chrome_options.add_argument(f"--window-size={image_size}")  # Set window size
+        if not gpu:
+            chrome_options.add_argument("--disable-gpu")
         if ignore_certificate_error:
             chrome_options.add_argument('--ignore-certificate-errors') # gnore-certificate-errors
             chrome_options.add_argument('--allow-insecure-localhost')  # gnore-certificate-errors
         # Initialize the Chrome driver
         driver = selenium.webdriver.Chrome(options=chrome_options)
+        if image_size.lower() in ['full','fullscreen','full_screen','auto']:
+            driver.maximize_window()
         rc=False,output_file
         try:
             # Navigate to the URL
@@ -3541,20 +3568,186 @@ def web_capture(url,output_file,image_size='1920,1080',wait_time=3,ignore_certif
                     next_do_button = driver.find_element(By.XPATH, "//button[@type='submit']")
                 next_do_button.click()
-            # Wait for the page to load
-            time.sleep(wait_time)
+            def _capture_(live_capture,driver,output_file,wait_time,capture_method,backup,ocr,log,find_string,daemon,video_file):
+                def wait_body(driver,timeout=10):
+                    #wait until get screen data
+                    try:
+                        selenium.webdriver.support.ui.WebDriverWait(driver,timeout).until(
+                            EC.presence_of_element_located((By.TAG_NAME,"body"))
+                            )
+                        return
+                    except:
+                        try:
+                            selenium.webdriver.support.ui.WebDriverWait(driver,timeout).until(
+                                lambda d: d.execute_script("return document.readyState") == "complete"
+                            )
+                            return
+                        except:
+                            pass
+                    time.sleep(timeout)
+                live_capture=Int(live_capture)
+                if not isinstance(wait_time,(int,float)):
+                    wait_time=Int(wait_time,10)
+                backup_idx=0
+                if backup:
+                    backup=Int(backup,2)
+                if isinstance(live_capture,int) and live_capture > wait_time*2:
+                    #Keep capture
+                    Time=TIME()
+                    if capture_type in ['mov','mp4']:
+                        frame_rate=1/wait_time
+                        window_size = driver.get_window_size()
+                        width = window_size['width']
+                        height = window_size['height']
+                        fourcc = cv2.VideoWriter_fourcc(*'mp4v') # Codec for MP4
+                        video_writer = cv2.VideoWriter(video_file, fourcc, frame_rate, (width, height))
+                    while True:
+                        if Time.Out(live_capture):
+                            driver.quit()
+                            if capture_type in ['mov','mp4']:
+                                video_writer.release()
+                                return True
+                            else:
+                                #Do something, but not return until timeout. So return False
+                                return False
+                        # Capture screenshot
+                        if log:
+                            if IsIn(log,['screen','log','print',print]):
+                                printf(Dot(),direct=True)
+                            else:
+                                printf(Dot(),log=log,direct=True)
+                        if backup and capture_type not in ['mov','mp4']:
+                            save_file='{}.{}'.format(output_file,backup_idx%backup)
+                        else:
+                            save_file=output_file
+                        #wait
+                        wait_body(driver,timeout=wait_time)
+                        #capture
+                        driver.save_screenshot(save_file)
+                        if capture_type in ['mov','mp4']:
+                            #Make a video file
+                            frame = cv2.imread(save_file)
+                            frame = cv2.resize(frame, (width, height))
+                            video_writer.write(frame)
+                        else:
+                            #do something with picture file
+                            if backup:
+                                if backup == 2:
+                                    comp_a=f'{output_file}.0'
+                                    comp_b=f'{output_file}.1'
+                                    if os.path.isfile(comp_a) and os.path.isfile(comp_b):
+                                        if filecmp.cmp(comp_a,comp_b):
+                                            if log:
+                                                if IsIn(log,['screen','log','print',print]):
+                                                    printf(Dot(),direct=True)
+                                                else:
+                                                    printf(Dot(),log=log,direct=True)
+                                            time.sleep(wait_time)
+                                            backup_idx+=1
+                                            continue
+                                shutil.copy2(save_file,output_file)
+                            if IsIn(capture_method,['log','screen','text']):
+                                found_words=ocr.Text(image_file=save_file)
+                                found_strings=found_space.join(found_words)
+                                if IsIn(log,['screen','log','print',print,None]):
+                                    printf(found_strings,mode='s')
+                                else:
+                                    printf(found_strings,log=log,mode='d')
+                                if find_string:
+                                    if find_string in found_strings:
+                                        #Find exit string, So True, So True, So True, So True
+                                        driver.quit()
+                                        return True
+                            backup_idx+=1
+                        #capture interval
+                        time.sleep(wait_time)
+                else:
+                    #Single capture
+                    #wait
+                    #wait_body(driver,timeout=wait_time)
+                    time.sleep(wait_time)
+                    #capture
+                    driver.save_screenshot(output_file)
+                    if IsIn(capture_method,['log','screen','text']):
+                        found_words=ocr.Text(image_file=output_file)
+                        found_strings=found_space.join(found_words)
+                        if IsIn(log,['screen','log','print',print,None]):
+                            printf(found_strings,mode='s')
+                        else:
+                            printf(found_strings,log=log,mode='d')
+                        if find_string:
+                            if find_string in found_strings:
+                                driver.quit()
+                                return True
+                    driver.quit()
+                    if IsIn(capture_method,['text']):
+                        return found_strings
+                    return True
+            ##
+            if IsIn(capture_type,['mov','mp4']):
+                if not video_file:
+                    video_file='{}.mp4'.format('.'.join(output_file.split('.')[:-1]))
+            #Background running
+            if daemon:
+                t=kThread(target=_capture_, args=(live_capture,driver,output_file,wait_time,capture_method,backup,ocr,log,find_string,daemon,video_file))
+                return t
+            else:
+                #Single process running
+                rc=_capture_(live_capture,driver,output_file,wait_time,capture_method,backup,ocr,log,find_string,daemon,video_file)
+                if IsIn(capture_type,['mov','mp4']):
+                    return rc,video_file
+                else:
+                    return rc,output_file
-            # Capture screenshot
-            driver.save_screenshot(output_file)
-            #print(f"Screenshot saved to {output_file}")
-            rc=True,output_file
         except Exception as e:
             #print(f"Error capturing screenshot: {str(e)}")
-            rc=False,str(e)
-        finally:
-            # Close the browser
             driver.quit()
-        return rc
+            return False,str(e)
+#        finally:
+#            # Close the browser
+#            driver.quit()
+#        return rc
+class OCR:
+    def __init__(self,image_file=None,enhance=False,language=['en'],gpu=False,model_storage_directory=None,**opts):
+        self.enhance=enhance
+        self.image_file=image_file
+        Import('easyocr')
+        if self.enhance:
+            Import('PIL',install_name='Pillow')
+            Import('numpy')
+        self.reader = easyocr.Reader(language,gpu=gpu,model_storage_directory=model_storage_directory)
+        # Suppress Torch pin_memory warning
+        warnings.filterwarnings("ignore", category=UserWarning, module="torch.utils.data.dataloader")
+        # Suppress EasyOCR CPU warning
+        #warnings.filterwarnings("ignore", message="WARNING:easyocr.easyocr:Using CPU. Note: This module is much faster with a GPU.")
+        # Suppress NetworkX backend warning
+        warnings.filterwarnings("ignore", category=RuntimeWarning, module="networkx.utils.backends")
+    def Text(self,detail=0,low_text=None,contrast_ths=None,image_file=None):
+        if not image_file: image_file=self.image_file
+        if not image_file: return False
+        opts={}
+        opts['detail']=detail
+        if isinstance(low_text,float): opts['low_text']=low_test
+        if isinstance(contrast_ths,float): opts['contrast_ths']=contrast_ths
+        if self.enhance:
+            image = PIL.Image.open(image_file)
+            image = image.convert('L') #Grayscale
+            image = PIL.ImageEnhance.Contrast(image).enhance(3.0) #high contrast
+            image = PIL.ImageEnhance.Sharpness(image).enhance(2.0)#Sharpen
+            image = image.convert('RGB').point(lambda p: 255 if p > 140 else 0)  # Adjust threshold if needed
+#            image = image.resize((800, int(800 * image.height / image.width)), PIL.Image.Resampling.LANCZOS)
+            image.save(image_file)
+#            image_np = numpy.array(image)
+#            return self.reader.readtext(image_np,**opts)
+#        else:
+        return self.reader.readtext(image_file,**opts)
 ############################################
 #Temporary function map for replacement

{kmisc-2.1.121.dist-info → kmisc-2.1.123.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: kmisc
-Version: 2.1.121
+Version: 2.1.123
 Summary: Enginering useful library
 Home-page: https://github.com/kagepark/kmisc
 Author: Kage Park

kmisc-2.1.123.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,6 @@
+kmisc/__init__.py,sha256=pu-2QG3sY7W_Vb6eJmpo7Mytvjs4DfaJseGNJN1GmgA,160300
+kmisc-2.1.123.dist-info/LICENSE,sha256=mn9ekhb34HJxsrVhcxrLXJUzy55T62zg-Gh9Ro0mVJI,1066
+kmisc-2.1.123.dist-info/METADATA,sha256=S9rNpdC9R3EUiB9m6p-DZyZcq16Sle34LwxrSzBaYoc,5523
+kmisc-2.1.123.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
+kmisc-2.1.123.dist-info/top_level.txt,sha256=wvdHf5aQTqcGYvxk-F9E_BMWLMhlwC8INBmwO-V6_X4,6
+kmisc-2.1.123.dist-info/RECORD,,

kmisc-2.1.121.dist-info/RECORD DELETED Viewed

@@ -1,6 +0,0 @@
-kmisc/__init__.py,sha256=uXh4rvX7twUmd9o7TqICr5UCWlAa2i8kzKmpa4BpbSA,150362
-kmisc-2.1.121.dist-info/LICENSE,sha256=mn9ekhb34HJxsrVhcxrLXJUzy55T62zg-Gh9Ro0mVJI,1066
-kmisc-2.1.121.dist-info/METADATA,sha256=L084X4RVPGQGXITXXVrYSswc1agQNfiKVJRdkDu6S3s,5523
-kmisc-2.1.121.dist-info/WHEEL,sha256=eOLhNAGa2EW3wWl_TU484h7q1UNgy0JXjjoqKoxAAQc,92
-kmisc-2.1.121.dist-info/top_level.txt,sha256=wvdHf5aQTqcGYvxk-F9E_BMWLMhlwC8INBmwO-V6_X4,6
-kmisc-2.1.121.dist-info/RECORD,,

{kmisc-2.1.121.dist-info → kmisc-2.1.123.dist-info}/LICENSE RENAMED Viewed

File without changes

{kmisc-2.1.121.dist-info → kmisc-2.1.123.dist-info}/WHEEL RENAMED Viewed

File without changes

{kmisc-2.1.121.dist-info → kmisc-2.1.123.dist-info}/top_level.txt RENAMED Viewed

File without changes

kmisc 2.1.121__py3-none-any.whl → 2.1.123__py3-none-any.whl

kmisc 2.1.121py3-none-any.whl → 2.1.123py3-none-any.whl