PyPI - deeplotx - Versions diffs - 0.2.21__py3-none-any.whl → 0.3.1__py3-none-any.whl - Mend

deeplotx 0.2.21__py3-none-any.whl → 0.3.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11) hide show

deeplotx/__init__.py +1 -1
deeplotx/encoder/__init__.py +1 -0
deeplotx/similarity/__init__.py +17 -0
deeplotx/similarity/distribution.py +32 -0
deeplotx/similarity/set.py +19 -0
deeplotx/similarity/vector.py +36 -0
{deeplotx-0.2.21.dist-info → deeplotx-0.3.1.dist-info}/METADATA +1 -1
{deeplotx-0.2.21.dist-info → deeplotx-0.3.1.dist-info}/RECORD +11 -7
{deeplotx-0.2.21.dist-info → deeplotx-0.3.1.dist-info}/WHEEL +0 -0
{deeplotx-0.2.21.dist-info → deeplotx-0.3.1.dist-info}/licenses/LICENSE +0 -0
{deeplotx-0.2.21.dist-info → deeplotx-0.3.1.dist-info}/top_level.txt +0 -0

deeplotx/__init__.py CHANGED Viewed

@@ -3,7 +3,7 @@ import os
 __ROOT__ = os.path.dirname(os.path.abspath(__file__))
-from .encoder import BertEncoder, LongTextEncoder
+from .encoder import BertEncoder, LongTextEncoder, LongformerEncoder
 from .nn import LinearRegression, LogisticRegression, SoftmaxRegression
 from .trainer import TextBinaryClassifierTrainer

deeplotx/encoder/__init__.py CHANGED Viewed

@@ -1,2 +1,3 @@
 from .bert_encoder import BertEncoder
 from .long_text_encoder import LongTextEncoder
+from .longformer_encoder import LongformerEncoder

deeplotx/similarity/__init__.py ADDED Viewed

@@ -0,0 +1,17 @@
+import numpy as np
+import torch
+bias = 1e-12
+def ndarray_adapter(*args) -> tuple | np.ndarray:
+    args = list(args)
+    for i, arg in enumerate(args):
+        match arg.__class__:
+            case torch.Tensor:
+                args[i] = arg.detach().cpu().numpy()
+            case List:
+                args[i] = np.asarray(arg)
+    if len(args) > 1:
+        return tuple(args)
+    return args[0]

deeplotx/similarity/distribution.py ADDED Viewed

@@ -0,0 +1,32 @@
+import numpy as np
+import torch
+from deeplotx.similarity import bias, ndarray_adapter
+def cross_entropy(p: torch.Tensor | np.ndarray, q: torch.Tensor | np.ndarray) -> np.float32:
+    p, q = ndarray_adapter(p, q)
+    q = np.clip(q, bias, 1 - bias)
+    return -1 * (np.sum(p * np.log(q)) / p.shape[0])
+def kl_divergence(p: torch.Tensor | np.ndarray, q: torch.Tensor | np.ndarray) -> np.float32:
+    p, q = ndarray_adapter(p, q)
+    q = np.where(q == 0, bias, q)
+    p = p / np.sum(p)
+    q = q / np.sum(q)
+    return np.sum(p * np.log(p / q))
+def js_divergence(p: torch.Tensor | np.ndarray, q: torch.Tensor | np.ndarray) -> np.float32:
+    p, q = ndarray_adapter(p, q)
+    m = (p + q) / 2
+    return (kl_divergence(p, m) + kl_divergence(q, m)) / 2
+def hellinger_distance(p: torch.Tensor | np.ndarray, q: torch.Tensor | np.ndarray) -> np.float32:
+    p, q = ndarray_adapter(p, q)
+    p = p / np.sum(p)
+    q = q / np.sum(q)
+    squared_diff = (np.sqrt(p) - np.sqrt(q)) ** 2
+    return np.sqrt(np.sum(squared_diff)) / np.sqrt(2)

deeplotx/similarity/set.py ADDED Viewed

@@ -0,0 +1,19 @@
+from deeplotx.similarity import bias
+def jaccard_similarity(set1: set, set2: set) -> float:
+    return (len(set1.intersection(set2)) + bias) / (len(set1.union(set2)) + bias)
+def overlap_coefficient(set1: set, set2: set) -> float:
+    return (len(set1.intersection(set2)) + bias) / (min(len(set1), len(set2)) + bias)
+def dice_coefficient(set1: set, set2: set) -> float:
+    return (2 * len(set1.intersection(set2)) + bias) / (len(set1) + len(set2) + bias)
+def ochiai_similarity(set1: set, set2: set) -> float:
+    intersection = len(set1.intersection(set2))
+    product = len(set1) ** 0.5 * len(set2) ** 0.5
+    return (intersection + bias) / (product + bias)

deeplotx/similarity/vector.py ADDED Viewed

@@ -0,0 +1,36 @@
+import numpy as np
+import torch
+from deeplotx.similarity import ndarray_adapter
+def l2_normalize(x: torch.Tensor | np.ndarray) -> np.ndarray:
+    x = ndarray_adapter(x)
+    return x / np.sqrt(np.sum(np.multiply(x, x)))
+def z_score_normalize(x: torch.Tensor | np.ndarray) -> np.ndarray:
+    x = ndarray_adapter(x)
+    mean = np.mean(x)
+    std_dev = np.std(x)
+    return (x - mean) / std_dev
+def euclidean_similarity(p: torch.Tensor | np.ndarray, q: torch.Tensor | np.ndarray) -> np.float32:
+    p, q = ndarray_adapter(p, q)
+    distance = p - q
+    distance = np.sum(np.multiply(distance, distance))
+    return np.sqrt(distance)
+def cosine_similarity(p: torch.Tensor | np.ndarray, q: torch.Tensor | np.ndarray) -> np.float32:
+    p, q = ndarray_adapter(p, q)
+    a = np.matmul(np.transpose(p), q)
+    b = np.sum(np.multiply(p, p))
+    c = np.sum(np.multiply(q, q))
+    return 1 - (a / (np.sqrt(b) * np.sqrt(c)))
+def chebyshev_similarity(p: torch.Tensor | np.ndarray, q: torch.Tensor | np.ndarray) -> np.float32:
+    p, q = ndarray_adapter(p, q)
+    return np.max(np.abs(p - q))

{deeplotx-0.2.21.dist-info → deeplotx-0.3.1.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: deeplotx
-Version: 0.2.21
+Version: 0.3.1
 Summary: Easy-2-use long text classifier trainers.
 Requires-Python: >=3.10
 Description-Content-Type: text/markdown

{deeplotx-0.2.21.dist-info → deeplotx-0.3.1.dist-info}/RECORD RENAMED Viewed

@@ -1,5 +1,5 @@
-deeplotx/__init__.py,sha256=Bhxc6HRnuhPZCMNlBc6oKcFTpJbWRGrZmt00vVOsNf0,916
-deeplotx/encoder/__init__.py,sha256=x7k8IE0FXvDl7kCJGWPsetOHFdvNCiCXHbYOdvo7_JQ,87
+deeplotx/__init__.py,sha256=C6N717chqnk3jqh9nuh9oM5hPldX9mCusCn-LqGWJJg,935
+deeplotx/encoder/__init__.py,sha256=EM-xrTsHoGaiiFpj-iFAxilMHXC_sQKWYrcq1qCnI3U,138
 deeplotx/encoder/bert_encoder.py,sha256=A-B7Gj94xv6UhvsFTBH7tnkAdGHRhfUZA2QjSnTKB6c,1970
 deeplotx/encoder/long_text_encoder.py,sha256=V6VxaHW6bMMaZHgU1UZ8n19UfSIV2f2sarWXquiFffQ,3018
 deeplotx/encoder/longformer_encoder.py,sha256=mZpC5TrGHQo98-ydGtVQQ9KRHgCGl1sRoxcQs7r4SSo,1409
@@ -8,14 +8,18 @@ deeplotx/nn/base_neural_network.py,sha256=Rkwu58mXXcuusf-59yLX89MywQx-EvTsSXOvlz
 deeplotx/nn/linear_regression.py,sha256=D4mEWVOq6q1Fm2otm57rgZ_E06HJLZBV5k636PprAf4,1520
 deeplotx/nn/logistic_regression.py,sha256=QAtZp2oyqOW8-1pJWVcahsSM83bzfA68EHObg-wSHHY,463
 deeplotx/nn/softmax_regression.py,sha256=eUn3mVNlye9ewVdw3McPHZuKbUvvaamsUgFIJMVMgBU,487
+deeplotx/similarity/__init__.py,sha256=JA1om2zeDcQVS1R04nDMdP6yegxdLJ14WF63pSTL3oo,418
+deeplotx/similarity/distribution.py,sha256=wQGouuuW531pZeBRKBujXsdsoz4fDnPw7_GW81jwepc,1066
+deeplotx/similarity/set.py,sha256=zhGFxtSIXlWqvipBYzoiPahp4g0boAIoUiMfG0wl07A,686
+deeplotx/similarity/vector.py,sha256=WVbDHqykt-fvuILVrhUCtIFAOEjY_zvttrXGM9eylG0,1125
 deeplotx/trainer/__init__.py,sha256=Fl5DR9UecQc5VtBcczU9sx_HtPNoFohpuELOh-Jrsks,77
 deeplotx/trainer/base_trainer.py,sha256=z0MeAT-rRYmjeBXt0ckt7J1itYArR0Cx02wHesXUoZE,385
 deeplotx/trainer/text_binary_classification_trainer.py,sha256=5O-5dwVMCj5EDX9gjJwCA468OR4UozJ7V8b-JxeUB0s,4080
 deeplotx/util/__init__.py,sha256=JxqAK_WOOHcYVSTHBT1-WuBwWrPEVDTV3titeVWvNUM,74
 deeplotx/util/hash.py,sha256=wwsC6kOQvbpuvwKsNQOARd78_wePmW9i3oaUuXRUnpc,352
 deeplotx/util/read_file.py,sha256=ptzouvEQeeW8KU5BrWNJlXw-vFXVrpS9SkAUxsu6A8A,612
-deeplotx-0.2.21.dist-info/licenses/LICENSE,sha256=IwGE9guuL-ryRPEKi6wFPI_zOhg7zDZbTYuHbSt_SAk,35823
-deeplotx-0.2.21.dist-info/METADATA,sha256=mNUcUO4dSccX1Sz8868nrbq3qWo3cINJXPVv8XtVpzY,1617
-deeplotx-0.2.21.dist-info/WHEEL,sha256=DnLRTWE75wApRYVsjgc6wsVswC54sMSJhAEd4xhDpBk,91
-deeplotx-0.2.21.dist-info/top_level.txt,sha256=hKg4pVDXZ-WWxkRfJFczRIll1Sv7VyfKCmzHLXbuh1U,9
-deeplotx-0.2.21.dist-info/RECORD,,
+deeplotx-0.3.1.dist-info/licenses/LICENSE,sha256=IwGE9guuL-ryRPEKi6wFPI_zOhg7zDZbTYuHbSt_SAk,35823
+deeplotx-0.3.1.dist-info/METADATA,sha256=GzIi1llGFDTLvHDLF3GOQ4G6MafM10M-7IeosZwZlaY,1616
+deeplotx-0.3.1.dist-info/WHEEL,sha256=DnLRTWE75wApRYVsjgc6wsVswC54sMSJhAEd4xhDpBk,91
+deeplotx-0.3.1.dist-info/top_level.txt,sha256=hKg4pVDXZ-WWxkRfJFczRIll1Sv7VyfKCmzHLXbuh1U,9
+deeplotx-0.3.1.dist-info/RECORD,,

{deeplotx-0.2.21.dist-info → deeplotx-0.3.1.dist-info}/WHEEL RENAMED Viewed

File without changes

{deeplotx-0.2.21.dist-info → deeplotx-0.3.1.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{deeplotx-0.2.21.dist-info → deeplotx-0.3.1.dist-info}/top_level.txt RENAMED Viewed

File without changes

deeplotx 0.2.21__py3-none-any.whl → 0.3.1__py3-none-any.whl

deeplotx 0.2.21__py3-none-any.whl → 0.3.1__py3-none-any.whl