PyPI - nlpertools - Versions diffs - 1.0.9__py3-none-any.whl → 1.0.11__py3-none-any.whl - Mend

nlpertools 1.0.9__py3-none-any.whl → 1.0.11__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (21) hide show

nlpertools/__init__.py +3 -2
nlpertools/cli.py +26 -47
nlpertools/dataprocess/__init__.py +1 -0
nlpertools/dataprocess/dedupl.py +9 -0
nlpertools/{dataprocess.py → dataprocess/dp_main.py} +13 -1
nlpertools/io/dir.py +25 -5
nlpertools/io/file.py +46 -43
nlpertools/llm/__init__.py +3 -0
nlpertools/llm/call_llm_once.py +60 -0
nlpertools/llm/infer.py +119 -0
nlpertools/llm/price.py +13 -0
nlpertools/ml.py +72 -59
nlpertools/other.py +82 -53
nlpertools/utils/package.py +9 -10
nlpertools/wrapper.py +6 -4
{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info}/METADATA +27 -25
{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info}/RECORD +21 -15
{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info}/WHEEL +1 -1
{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info}/entry_points.txt +0 -0
{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info/licenses}/LICENSE +0 -0
{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info}/top_level.txt +0 -0

nlpertools/other.py CHANGED Viewed

@@ -3,7 +3,6 @@
 # @Author  : youshu.Ji
 import itertools
 import os
-import re
 import string
 import subprocess
 import threading
@@ -13,7 +12,10 @@ import math
 import datetime
 import difflib
 import psutil
+import sys
 from .io.file import writetxt_w_list, writetxt_a
 # import numpy as np
 # import psutil
 # import pyquery as pq
@@ -25,9 +27,9 @@ from .io.file import writetxt_w_list, writetxt_a
 # from win32evtlogutil import langid
 from .utils.package import *
-CHINESE_PUNCTUATION = list('，。；：‘’“”！？《》「」【】<>（）、')
-ENGLISH_PUNCTUATION = list(',.;:\'"!?<>()')
-OTHER_PUNCTUATION = list('!@#$%^&*')
+CHINESE_PUNCTUATION = list("，。；：‘’“”！？《》「」【】<>（）、")
+ENGLISH_PUNCTUATION = list(",.;:'\"!?<>()")
+OTHER_PUNCTUATION = list("!@#$%^&*")
 def setup_logging(log_file):
@@ -40,11 +42,23 @@ def setup_logging(log_file):
     logging.basicConfig(
         filename=log_file,
         level=logging.INFO,
-        format='%(asctime)s - %(levelname)s - %(message)s',
-        datefmt='%Y-%m-%d %H:%M:%S'
+        format="%(asctime)s - %(levelname)s - %(message)s",
+        datefmt="%Y-%m-%d %H:%M:%S",
     )
+def stop():
+    sys.exit()
+def exit():
+    sys.exit()
+def round2(num):
+    return round(num * 100, 2)
 def get_diff_parts(str1, str2):
     # 创建一个 SequenceMatcher 对象
     matcher = difflib.SequenceMatcher(None, str1, str2)
@@ -52,7 +66,7 @@ def get_diff_parts(str1, str2):
     # 获取差异部分
     diff_parts = []
     for tag, i1, i2, j1, j2 in matcher.get_opcodes():
-        if tag == 'replace' or tag == 'delete' or tag == 'insert':
+        if tag == "replace" or tag == "delete" or tag == "insert":
             diff_parts.append((tag, str1[i1:i2], str2[j1:j2]))
     return diff_parts
@@ -62,8 +76,9 @@ def run_cmd_with_timeout(cmd, timeout):
     """
     https://juejin.cn/post/7391703459803086848
     """
-    process = subprocess.Popen(cmd, shell=True, encoding="utf-8", errors="ignore", stdout=subprocess.PIPE,
-                               stderr=subprocess.PIPE)
+    process = subprocess.Popen(
+        cmd, shell=True, encoding="utf-8", errors="ignore", stdout=subprocess.PIPE, stderr=subprocess.PIPE
+    )
     res = [None]
     def target():
@@ -144,8 +159,11 @@ def print_three_line_table(df):
             border-bottom: (third_line_px)px solid black;
         }
     </style>"""
-    style = style.replace("(first_line_px)", first_line_px).replace("(second_line_px)", second_line_px).replace(
-        "(third_line_px)", third_line_px)
+    style = (
+        style.replace("(first_line_px)", first_line_px)
+        .replace("(second_line_px)", second_line_px)
+        .replace("(third_line_px)", third_line_px)
+    )
     # 将 CSS 样式和 HTML 表格结合起来
     html = f"{style}{html_table}"
     print(html)
@@ -153,7 +171,7 @@ def print_three_line_table(df):
     # 将 HTML 保存到文件中
     with open(temp_file_path, "w") as f:
         f.write(html)
-    webbrowser.open('file://' + os.path.realpath(temp_file_path))
+    webbrowser.open("file://" + os.path.realpath(temp_file_path))
 def jprint(obj, depth=0):
@@ -169,12 +187,16 @@ def jprint(obj, depth=0):
         print(obj)
-def print_split(sign="=", num=20):
-    print(sign * num)
+def print_split(sign="=", num=20, char: str = None):
+    if char:
+        print(sign * num // 2, char, sign * num // 2)
+    else:
+        print(sign * num)
 def seed_everything():
     import torch
     # seed everything
     seed = 7777777
     np.random.seed(seed)
@@ -189,22 +211,23 @@ def sent_email(mail_user, mail_pass, receiver, title, content, attach_path=None)
     from email.mime.text import MIMEText
     from email.mime.application import MIMEApplication
-    mail_host = 'smtp.qq.com'
+    mail_host = "smtp.qq.com"
     mail_user = mail_user
     mail_pass = mail_pass
     sender = mail_user
     message = MIMEMultipart()
-    message.attach(MIMEText(content, 'plain', 'utf-8'))
+    message.attach(MIMEText(content, "plain", "utf-8"))
     if attach_path:
-        attachment = MIMEApplication(open(attach_path, 'rb').read())
-        attachment["Content-Type"] = 'application/octet-stream'
-        attachment.add_header('Content-Dispositon', 'attachment',
-                              filename=('utf-8', '', attach_path))  # 注意：此处basename要转换为gbk编码，否则中文会有乱码。
+        attachment = MIMEApplication(open(attach_path, "rb").read())
+        attachment["Content-Type"] = "application/octet-stream"
+        attachment.add_header(
+            "Content-Dispositon", "attachment", filename=("utf-8", "", attach_path)
+        )  # 注意：此处basename要转换为gbk编码，否则中文会有乱码。
         message.attach(attachment)
-    message['Subject'] = title
-    message['From'] = sender
-    message['To'] = receiver
+    message["Subject"] = title
+    message["From"] = sender
+    message["To"] = receiver
     try:
         smtp_obj = smtplib.SMTP()
@@ -212,9 +235,9 @@ def sent_email(mail_user, mail_pass, receiver, title, content, attach_path=None)
         smtp_obj.login(mail_user, mail_pass)
         smtp_obj.sendmail(sender, receiver, message.as_string())
         smtp_obj.quit()
-        print('send email success')
+        print("send email success")
     except smtplib.SMTPException as e:
-        print('send failed', e)
+        print("send failed", e)
 def convert_np_to_py(obj):
@@ -244,12 +267,12 @@ def camel_to_snake(s: str) -> str:
     :param s: camel case variable
     :return:
     """
-    return reduce(lambda x, y: x + ('_' if y.isupper() else '') + y, s).lower()
+    return reduce(lambda x, y: x + ("_" if y.isupper() else "") + y, s).lower()
 # other ----------------------------------------------------------------------
 # 统计词频
-def calc_word_count(list_word, mode, path='tempcount.txt', sort_id=1, is_reverse=True):
+def calc_word_count(list_word, mode, path="tempcount.txt", sort_id=1, is_reverse=True):
     word_count = {}
     for key in list_word:
         if key not in word_count:
@@ -257,20 +280,20 @@ def calc_word_count(list_word, mode, path='tempcount.txt', sort_id=1, is_reverse
         else:
             word_count[key] += 1
     word_dict_sort = sorted(word_count.items(), key=lambda x: x[sort_id], reverse=is_reverse)
-    if mode == 'w':
+    if mode == "w":
         for key in word_dict_sort:
-            writetxt_a(str(key[0]) + '\t' + str(key[1]) + '\n', path)
-    elif mode == 'p':
+            writetxt_a(str(key[0]) + "\t" + str(key[1]) + "\n", path)
+    elif mode == "p":
         for key in word_dict_sort:
-            print(str(key[0]) + '\t' + str(key[1]))
-    elif mode == 'u':
+            print(str(key[0]) + "\t" + str(key[1]))
+    elif mode == "u":
         return word_dict_sort
 # 字典去重
 def dupl_dict(dict_list, key):
     new_dict_list, value_set = [], []
-    print('去重中...')
+    print("去重中...")
     for i in tqdm(dict_list):
         if i[key] not in value_set:
             new_dict_list.append(i)
@@ -285,9 +308,9 @@ def multi_thread_run(_task, data):
 def del_special_char(sentence):
-    special_chars = ['\ufeff', '\xa0', '\u3000', '\xa0', '\ue627']
+    special_chars = ["\ufeff", "\xa0", "\u3000", "\xa0", "\ue627"]
     for i in special_chars:
-        sentence = sentence.replace(i, '')
+        sentence = sentence.replace(i, "")
     return sentence
@@ -303,20 +326,20 @@ def spider(url):
     :param url:
     :return:
     """
-    if 'baijiahao' in url:
+    if "baijiahao" in url:
         content = requests.get(url)
         # print(content.text)
         html = pq.PyQuery(content.text)
-        title = html('.index-module_articleTitle_28fPT').text()
-        res = html('.index-module_articleWrap_2Zphx').text().rstrip('举报/反馈')
-        return '{}\n{}'.format(title, res)
+        title = html(".index-module_articleTitle_28fPT").text()
+        res = html(".index-module_articleWrap_2Zphx").text().rstrip("举报/反馈")
+        return "{}\n{}".format(title, res)
 def eda(sentence):
-    url = 'https://x.x.x.x:x/eda'
+    url = "https://x.x.x.x:x/eda"
     json_data = dict({"sentence": sentence})
     res = requests.post(url, json=json_data)
-    return res.json()['eda']
+    return res.json()["eda"]
 def find_language(text):
@@ -350,8 +373,8 @@ def print_prf(y_true, y_pred, label=None):
     for i in range(len(label)):
         res = []
         for k in result:
-            res.append('%.5f' % k[i])
-        print('{}: {} {} {}'.format(label[i], *res[:3]))
+            res.append("%.5f" % k[i])
+        print("{}: {} {} {}".format(label[i], *res[:3]))
 def print_cpu():
@@ -372,14 +395,16 @@ def squeeze_list(high_dim_list):
 def unsqueeze_list(flatten_list, each_element_len):
     # 该函数是错的，被split_list替代了
-    two_dim_list = [flatten_list[i * each_element_len:(i + 1) * each_element_len] for i in
-                    range(len(flatten_list) // each_element_len)]
+    two_dim_list = [
+        flatten_list[i * each_element_len : (i + 1) * each_element_len]
+        for i in range(len(flatten_list) // each_element_len)
+    ]
     return two_dim_list
 def split_list(input_list, chunk_size):
     # 使用列表推导式将列表分割成二维数组
-    return [input_list[i:i + chunk_size] for i in range(0, len(input_list), chunk_size)]
+    return [input_list[i : i + chunk_size] for i in range(0, len(input_list), chunk_size)]
 def auto_close():
@@ -389,6 +414,7 @@ def auto_close():
     import pyautogui as pg
     import time
     import os
     cmd = 'schtasks /create /tn shut /tr "shutdown -s -f" /sc once /st 23:30'
     os.system(cmd)
     while 1:
@@ -402,10 +428,13 @@ def tf_idf(corpus, save_path):
     vectorizer = CountVectorizer()  # 该类会将文本中的词语转换为词频矩阵，矩阵元素a[i][j] 表示j词在i类文本下的词频
     transformer = TfidfTransformer()  # 该类会统计每个词语的tf-idf权值
     tfidf = transformer.fit_transform(
-        vectorizer.fit_transform(corpus))  # 第一个fit_transform是计算tf-idf，第二个fit_transform是将文本转为词频矩阵
+        vectorizer.fit_transform(corpus)
+    )  # 第一个fit_transform是计算tf-idf，第二个fit_transform是将文本转为词频矩阵
     word = vectorizer.get_feature_names()  # 获取词袋模型中的所有词语
     weight = tfidf.toarray()  # 将tf-idf矩阵抽取出来，元素a[i][j]表示j词在i类文本中的tf-idf权重
-    for i in range(len(weight)):  # 打印每类文本的tf-idf词语权重，第一个for遍历所有文本，第二个for便利某一类文本下的词语权重
+    for i in range(
+        len(weight)
+    ):  # 打印每类文本的tf-idf词语权重，第一个for遍历所有文本，第二个for便利某一类文本下的词语权重
         for j in range(len(word)):
             getword = word[j]
             getvalue = weight[i][j]
@@ -415,7 +444,7 @@ def tf_idf(corpus, save_path):
                 else:
                     tfidfdict.update({getword: getvalue})
     sorted_tfidf = sorted(tfidfdict.items(), key=lambda d: d[1], reverse=True)
-    to_write = ['{} {}'.format(i[0], i[1]) for i in sorted_tfidf]
+    to_write = ["{} {}".format(i[0], i[1]) for i in sorted_tfidf]
     writetxt_w_list(to_write, save_path, num_lf=1)
@@ -424,7 +453,7 @@ class GaussDecay(object):
     当前只实现了时间的，全部使用默认值
     """
-    def __init__(self, origin='2022-08-02', scale='90d', offset='5d', decay=0.5, task="time"):
+    def __init__(self, origin="2022-08-02", scale="90d", offset="5d", decay=0.5, task="time"):
         self.origin = origin
         self.task = task
         self.scale, self.offset = self.translate(scale, offset)
@@ -448,7 +477,7 @@ class GaussDecay(object):
     @staticmethod
     def translated_minus(field_value):
         origin = datetime.datetime.now()
-        field_value = datetime.datetime.strptime(field_value, '%Y-%m-%d %H:%M:%S')
+        field_value = datetime.datetime.strptime(field_value, "%Y-%m-%d %H:%M:%S")
         return (origin - field_value).days
     def calc_exp(self):
@@ -466,13 +495,13 @@ class GaussDecay(object):
         :return:
         """
         numerator = max(0, (abs(self.translated_minus(field_value)) - self.offset)) ** 2
-        sigma_square = -1 * self.scale ** 2 / (2 * math.log(self.decay, math.e))
+        sigma_square = -1 * self.scale**2 / (2 * math.log(self.decay, math.e))
         denominator = 2 * sigma_square
         s = math.exp(-1 * numerator / denominator)
         return round(self.time_coefficient * s + self.related_coefficient * raw_score, 7)
-if __name__ == '__main__':
+if __name__ == "__main__":
     gauss_decay = GaussDecay()
     res = gauss_decay.calc_gauss(raw_score=1, field_value="2021-05-29 14:31:13")
     print(res)

nlpertools/utils/package.py CHANGED Viewed

@@ -37,20 +37,19 @@ def lazy_import(importer_name, to_import):
     module = importlib.import_module(importer_name)
     import_mapping = {}
     for name in to_import:
-        importing, _, binding = name.partition(' as ')
+        importing, _, binding = name.partition(" as ")
         if not binding:
-            _, _, binding = importing.rpartition('.')
+            _, _, binding = importing.rpartition(".")
         import_mapping[binding] = importing
     def __getattr__(name):
         if name not in import_mapping:
-            message = f'module {importer_name!r} has no attribute {name!r}'
+            message = f"module {importer_name!r} has no attribute {name!r}"
             raise AttributeError(message)
         importing = import_mapping[name]
         # imortlib.import_module() implicitly sets submodules on this module as
         # appropriate for direct imports.
-        imported = importlib.import_module(importing,
-                                           module.__spec__.parent)
+        imported = importlib.import_module(importing, module.__spec__.parent)
         setattr(module, name, imported)
         return imported
@@ -75,15 +74,15 @@ KafkaConsumer = try_import("kafka", "KafkaConsumer")
 np = try_import("numpy", None)
 plt = try_import("matplotlib", "pyplot")
 WordNetLemmatizer = try_import("nltk.stem", "WordNetLemmatizer")
-metrics = try_import("sklearn", "metrics")
+# metrics = try_import("sklearn", "metrics")
 requests = try_import("requests", None)
 pq = try_import("pyquery", None)
-CountVectorizer = try_import("sklearn.feature_extraction.text", "CountVectorizer")
-precision_recall_fscore_support = try_import("sklearn.metrics", "precision_recall_fscore_support")
+# CountVectorizer = try_import("sklearn.feature_extraction.text", "CountVectorizer")
+# precision_recall_fscore_support = try_import("sklearn.metrics", "precision_recall_fscore_support")
 tqdm = try_import("tqdm", "tqdm")
 # TODO 自动导出langid和win32evtlogutil输出有bug
 langid = try_import("langid", None)
 win32evtlogutil = try_import("win32evtlogutil", None)
-TfidfTransformer = try_import("sklearn.feature_extraction.text", "TfidfTransformer")
+# TfidfTransformer = try_import("sklearn.feature_extraction.text", "TfidfTransformer")
 yaml = try_import("yaml", None)
-omegaconf = try_import("omegaconf", None)
+omegaconf = try_import("omegaconf", None)

nlpertools/wrapper.py CHANGED Viewed

@@ -7,16 +7,18 @@ import time
 from functools import wraps
 import asyncio
 def fn_async_timer(function):
     """
     针对异步函数的装饰器
     """
     @wraps(function)
     async def function_timer(*args, **kwargs):
         t0 = time.time()
         result = await function(*args, **kwargs)
         t1 = time.time()
-        print('[finished {func_name} in {time:.2f}s]'.format(func_name=function.__name__, time=t1 - t0))
+        print("[finished {func_name} in {time:.2f}s]".format(func_name=function.__name__, time=t1 - t0))
         return result
     return function_timer
@@ -36,14 +38,14 @@ def fn_timer(async_func=False, analyse=False):
             t0 = time.time()
             result = await asyncio.create_task(func(*args, **kwargs))
             t1 = time.time()
-            print('[finished {func_name} in {time:.2f}s]'.format(func_name=func.__name__, time=t1 - t0))
+            print("[finished {func_name} in {time:.2f}s]".format(func_name=func.__name__, time=t1 - t0))
             return result
         def func_time(*args, **kwargs):
             t0 = time.time()
             result = func(*args, **kwargs)
             t1 = time.time()
-            print('[finished {func_name} in {time:.2f}s]'.format(func_name=func.__name__, time=t1 - t0))
+            print("[finished {func_name} in {time:.2f}s]".format(func_name=func.__name__, time=t1 - t0))
             return result
         def func_time_analyse(*args, **kwargs):
@@ -114,7 +116,7 @@ def fn_try(parameter):
                 return result
             except Exception as e:
                 msg = "报错！"
-                print('[func_name: {func_name} {msg}]'.format(func_name=function.__name__, msg=msg))
+                print("[func_name: {func_name} {msg}]".format(func_name=function.__name__, msg=msg))
                 parameter["msg"] = parameter["msg"].format(str(e))
                 return parameter
             finally:

{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
-Metadata-Version: 2.2
+Metadata-Version: 2.4
 Name: nlpertools
-Version: 1.0.9
+Version: 1.0.11
 Summary: A small package about small basic IO operation when coding
 Home-page: https://github.com/lvzii/nlpertools
 Author: youshuJi
@@ -15,8 +15,10 @@ License-File: LICENSE
 Requires-Dist: numpy
 Requires-Dist: pandas
 Requires-Dist: psutil
+Requires-Dist: openai
 Provides-Extra: torch
 Requires-Dist: torch; extra == "torch"
+Dynamic: license-file
 Dynamic: provides-extra
 Dynamic: requires-dist
@@ -50,6 +52,25 @@ nlpertools
 ```
+# 最常用/喜欢的功能（使用示例）
+```python
+# 读txt, json文件
+import nlpertools
+txt_data = nlpertools.readtxt_list_all_strip('res.txt')
+json_data = nlpertools.load_from_json('res.json')
+```
+```bash
+## git, 连接github不稳定的时候非常有用
+ncli git pull
+## 带有参数时，加上--以避免-u被解析
+ncli -- git push -u origin main
+# 生成pypi双因素认证的实时密钥(需要提供key)
+ncli --get_2fa --get_2fa_key your_key
+```
 # 安装
 Install the latest release version
@@ -101,30 +122,7 @@ https://nlpertools.readthedocs.io/en/latest/
 一些可能需要配置才能用的函数，写上示例
-## 使用示例
-```python
-import nlpertools
-a = nlpertools.readtxt_list_all_strip('res.txt')
-# 或
-b = nlpertools.io.file.readtxt_list_all_strip('res.txt')
-```
-```bash
-# 生成pypi双因素认证的实时密钥(需要提供key)
-python -m nlpertools.cli --get_2fa --get_2fa_key your_key
-## git
-python -m nlpertools.cli --git_push
-python -m nlpertools.cli --git_pull
-# 以下功能被nvitop替代，不推荐使用
-## 监控gpu显存
-python -m nlpertools.monitor.gpu
-## 监控cpu
-python -m  nlpertools.monitor.memory
-```
 ## 一些常用项目
@@ -132,3 +130,7 @@ nvitop
 ydata-profiling
+## 贡献
+https://github.com/bigscience-workshop/data-preparation

{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info}/RECORD RENAMED Viewed

@@ -1,20 +1,19 @@
-nlpertools/__init__.py,sha256=5ka-NeGW2AUDJ4YZ12DD64xcxuxf9PlQUurxDp5DHbQ,483
-nlpertools/cli.py,sha256=4Ik1NyFaoZpZLsYLAFRLk6xuYQk0IvexPr1Ieq08viE,3932
+nlpertools/__init__.py,sha256=VnH7GWVSTcV010_kD4VtsOAwIjzhe8prax8Wj17uc20,537
+nlpertools/cli.py,sha256=uCIUkiBXqTWJaxSQd5MlliGcTfxWzymo1UyQ3z_uhak,3612
 nlpertools/data_client.py,sha256=esX8lUQrTui4uVkqPfhpHVok7Eq6ywpuemKjLeqoglc,14674
-nlpertools/dataprocess.py,sha256=v1mobuYN7I3dT6xIKlNOHVtcg31YtjF6FwNPTxeBFFY,23153
 nlpertools/default_db_config.yml,sha256=E1K9k_xzXVlsf-HJQh8kyHXHYuvTpD12jD4Hfe5rUk8,606
 nlpertools/get_2fa.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-nlpertools/ml.py,sha256=qhUBCLuHfcFy8g5ZHNGYq4eH2vYWiGetyKucv8n60-A,18523
+nlpertools/ml.py,sha256=fjI-WMM1lRnOnRFfTLEGplUx_Uamgr2gfmoAvGlgF7E,18994
 nlpertools/movie.py,sha256=rkyOnAXdsbWfMSbi1sE1VNRT7f66Hp9BnZsN_58Afmw,897
 nlpertools/nlpertools_config.yml,sha256=ksXejxFs7pxR47tNAsrN88_4gvq9PCA2ZMO07H-dJXY,26
 nlpertools/open_api.py,sha256=uyTY00OUlM57Cn0Wm0yZXcIS8vAszy9rKnDMBEWfWJM,1744
-nlpertools/other.py,sha256=JWJiXHRI8mhiUV3k4CZ4kQQS9QN3mw67SmGgTqZFtjs,15026
+nlpertools/other.py,sha256=LaNZRQ8wWJqZP6Gycq7eThEqcGXIANg7WzT6nh5QiKQ,15262
 nlpertools/pic.py,sha256=13aaFJh3USGYGs4Y9tAKTvWjmdQR4YDjl3LlIhJheOA,9906
 nlpertools/plugin.py,sha256=LB7j9GdoQi6TITddH-6EglHlOa0WIHLUT7X5vb_aIZY,1168
 nlpertools/reminder.py,sha256=wiXwZQmxMck5vY3EvG8_oakP3FAdjGTikAIOiTPUQrs,2977
 nlpertools/utils_for_nlpertools.py,sha256=SJqjfMc2Vd8ZCqzQiJCkSxjJxEKzvEUgAgbhKPtC6ww,3583
 nlpertools/vector_index_demo.py,sha256=CSCzXD13bUIo9AG-bjen668H10B02HFU1Kbxakvrs68,2924
-nlpertools/wrapper.py,sha256=xQ7UUAAqSEaRJweoZyGSTjM4B3FQNLl5Gou968Sl_hA,4348
+nlpertools/wrapper.py,sha256=8ReHv7LrBGX6wHma8rf_EhFPg0FJNoDjbn4p0O2UHzs,4350
 nlpertools/algo/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nlpertools/algo/ac.py,sha256=4BSiJdG8-S78w_KRqvGOkYjxuTDRiBsskRv-6Doi7oE,422
 nlpertools/algo/bit_ops.py,sha256=l14-j5VOqrab80CA_uBs1AiAJbzJUJH9dJXc7O9F5d0,501
@@ -24,12 +23,19 @@ nlpertools/algo/template.py,sha256=9vsHr4g3jZZ5KVU_2I9i97o8asRXq-8pSaCXIv0sHeM,2
 nlpertools/algo/union.py,sha256=0l7lGZbw1qIfW1z5TE8Oo3tybL1bKIP5rzpa5ZT-vLQ,249
 nlpertools/data_structure/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nlpertools/data_structure/base_structure.py,sha256=gVUvJZ5jsCAswRETTpMwcEjLKoageWiTuCKNEwIWKWk,2641
+nlpertools/dataprocess/__init__.py,sha256=YPBPsZ8vAoMS6GJ7GlCqj01Cx1q8dDARc_gW-ysORyk,21
+nlpertools/dataprocess/dedupl.py,sha256=WIBOrM6LfX3txcDa0xF7rqeBIpfqwrDBgepa6bavpt0,289
+nlpertools/dataprocess/dp_main.py,sha256=iyDsmKzUx5lD8EUNwkWIlTGKVQQDVx8p3pXFv2_kR64,23452
 nlpertools/draw/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nlpertools/draw/draw.py,sha256=19dskkr0wrgczxPJnphEszliwYshEh5SjD8Zz07nlk0,2615
 nlpertools/draw/math_func.py,sha256=0NQ22Dfi9DFG6Bg_hXnCT27w65-dqpOOIgZX7oUIW-Q,881
 nlpertools/io/__init__.py,sha256=YMuKtC2Ddh5dL5MvXjyUKYOOuqzFYUhBPFaP2kyFG9I,68
-nlpertools/io/dir.py,sha256=FPY62COQN8Ji72pk0dYRoXkrORYaUlybKNcL4474uUI,2263
-nlpertools/io/file.py,sha256=mLWl09IEi0rWPN4tTq3LwdYMvAjj4e_QsjEMhufuPPo,7192
+nlpertools/io/dir.py,sha256=jpJuCwLeBInr03iCSUfffmlchWShZ2Cjq38n0D0dILI,3106
+nlpertools/io/file.py,sha256=NF1xV5iazl86-TDdMQJ-LLrqCnuW29uuFb_NA55YNr4,7274
+nlpertools/llm/__init__.py,sha256=SdbGjzhu1lCeq55mC0tgsah9yzVxvvNrWMf2z8kDEoQ,71
+nlpertools/llm/call_llm_once.py,sha256=W0J2Ab8dHnVZ8q_KgfTKbee7NlJnA-ewjsne80ALLXY,1793
+nlpertools/llm/infer.py,sha256=q7asgwdJwo27d6rdBNQLys_bPEF0g-UNDKjt3S-Ltvs,4133
+nlpertools/llm/price.py,sha256=8zzEaLrbGiDUbTFSnuBGAduiSfDVXQUk4Oc_lE6eJFw,544
 nlpertools/monitor/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nlpertools/monitor/gpu.py,sha256=M59O6i0hlew7AzXZlaVZqbZA5IR93OhBY2WI0-T_HtY,531
 nlpertools/monitor/memory.py,sha256=9t6q9BC8VVx4o3G4sBCn7IoQRx272zMPjSnL3yvTBAQ,657
@@ -37,13 +43,13 @@ nlpertools/template/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSu
 nlpertools/utils/__init__.py,sha256=YMuKtC2Ddh5dL5MvXjyUKYOOuqzFYUhBPFaP2kyFG9I,68
 nlpertools/utils/lazy.py,sha256=SAeHLjxsYhpKWvcQKjs2eY0Nn5n3CJlqtxOLVOe1WjQ,29280
 nlpertools/utils/log_util.py,sha256=ftJDoTOtroLH-LadOygZljeyltOQn0D2Xb5x7Td1Qdg,428
-nlpertools/utils/package.py,sha256=wLg_M8j7Y6ReRjWHWCWoZJHrzEwuAr9TyG2jvb7OQCo,3261
+nlpertools/utils/package.py,sha256=8TLbrD3nmukpJw9lSpHHbUYK74qyAaSM_jUrCJOG6mo,3227
 nlpertools/utils/package_v1.py,sha256=sqgFb-zbTdMd5ziJLY6YUPqR49qUNZjxBH35DnyR5Wg,3542
 nlpertools/utils/package_v2.py,sha256=WOcsguWfUd4XSAfmPgCtL8HtUbqJ6GRSMHb0OsB47r0,3932
+nlpertools-1.0.11.dist-info/licenses/LICENSE,sha256=SBcMozykvTbZJ--MqSiKUmHLLROdnr25V70xCQgEwqw,11331
 nlpertools_helper/__init__.py,sha256=obxRUdZDctvcvK_iA1Dx2HmQFMlMzJto-xDPryq1lJ0,198
-nlpertools-1.0.9.dist-info/LICENSE,sha256=SBcMozykvTbZJ--MqSiKUmHLLROdnr25V70xCQgEwqw,11331
-nlpertools-1.0.9.dist-info/METADATA,sha256=lcKmxc7_mtYH47mPj8UHOM8-5T5YtrDwhHWVZkfHZXU,3330
-nlpertools-1.0.9.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
-nlpertools-1.0.9.dist-info/entry_points.txt,sha256=XEazQ4vUwJMoMAgAwk1Lq4PRQGklPkPBaFkiP0zN_JE,45
-nlpertools-1.0.9.dist-info/top_level.txt,sha256=_4q4MIFvMr4cAUbhWKWYdRXIXsF4PJDg4BUsZvgk94s,29
-nlpertools-1.0.9.dist-info/RECORD,,
+nlpertools-1.0.11.dist-info/METADATA,sha256=3KXxqbO2wWDMXLmnZJm2RvETybvIMekPelhSxE_ovKk,3386
+nlpertools-1.0.11.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+nlpertools-1.0.11.dist-info/entry_points.txt,sha256=XEazQ4vUwJMoMAgAwk1Lq4PRQGklPkPBaFkiP0zN_JE,45
+nlpertools-1.0.11.dist-info/top_level.txt,sha256=_4q4MIFvMr4cAUbhWKWYdRXIXsF4PJDg4BUsZvgk94s,29
+nlpertools-1.0.11.dist-info/RECORD,,

{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info}/WHEEL RENAMED Viewed

@@ -1,5 +1,5 @@
 Wheel-Version: 1.0
-Generator: setuptools (75.8.0)
+Generator: setuptools (80.9.0)
 Root-Is-Purelib: true
 Tag: py3-none-any

{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info/licenses}/LICENSE RENAMED Viewed

File without changes

{nlpertools-1.0.9.dist-info → nlpertools-1.0.11.dist-info}/top_level.txt RENAMED Viewed

File without changes

nlpertools 1.0.9__py3-none-any.whl → 1.0.11__py3-none-any.whl

nlpertools 1.0.9__py3-none-any.whl → 1.0.11__py3-none-any.whl