PyPI - datamuse - Versions diffs - 0.2.0__tar.gz → 0.3.0__tar.gz - Mend

datamuse 0.2.0 (tar.gz) → 0.3.0 (tar.gz)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

{datamuse-0.2.0 → datamuse-0.3.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: datamuse
-Version: 0.2.0
+Version: 0.3.0
 Summary: datamuse is a simple wrapper around the datamuse api https://www.datamuse.com/api/
 Author-email: Bivas Kumar <thetrotfreak@yahoo.com>
 License-Expression: MIT

datamuse-0.3.0/datamuse/annotations.py ADDED Viewed

@@ -0,0 +1,101 @@
+from enum import StrEnum
+from types import MappingProxyType
+from typing import Literal, LiteralString, NotRequired, TypeAlias, TypedDict
+Word: TypeAlias = LiteralString
+RelatedWordCode = Literal[
+    "nouns_adjective",
+    "adjectives_noun",
+    "synonyms",
+    "triggers",
+    "antonyms",
+    "hypernyms",
+    "hyponyms",
+    "holonyms",
+    "meronyms",
+    "frequent_followers",
+    "frequent_predecessors",
+    "homophones",
+    "consonant",
+]
+_lookup_related_code = MappingProxyType(
+    {
+        "nouns_adjective": "jja",
+        "adjectives_noun": "jjb",
+        "synonyms": "syn",
+        "triggers": "trg",
+        "antonyms": "ant",
+        "hypernyms": "spc",
+        "hyponyms": "gen",
+        "holonyms": "com",
+        "meronyms": "par",
+        "frequent_followers": "bga",
+        "frequent_predecessors": "bgb",
+        "homophones": "hom",
+        "consonant": "cns",
+    }
+)
+MetadataFlag = Literal[
+    "definitions",
+    "parts_of_speech",
+    "syllable_count",
+]
+_lookup_metadata_flag = MappingProxyType(
+    {
+        "definitions": "d",
+        "parts_of_speech": "p",
+        "syllable_count": "s",
+    }
+)
+class WordRelation(StrEnum):
+    """
+    When paired with a `Word`, the `Word` will be in a predefined lexical relation.
+    """
+    nouns_adjective = "jja"
+    adjectives_noun = "jjb"
+    synonyms = "syn"
+    triggers = "trg"
+    antonyms = "ant"
+    hypernyms = "spc"
+    hyponyms = "gen"
+    holonyms = "com"
+    meronyms = "par"
+    frequent_followers = "bga"
+    frequent_predecessors = "bgb"
+    homophones = "hom"
+    consonant = "cns"
+class WordMetadata(StrEnum):
+    """
+    Extra lexical knowledge for a `Word`
+    """
+    definitions = "d"
+    parts_of_speech = "p"
+    syllable_count = "s"
+class WordObject(TypedDict):
+    """
+    Representation of a word from the Datamuse API
+    """
+    word: Word
+    defs: NotRequired[list[str]]
+    tags: NotRequired[list[str]]
+    numSyllables: NotRequired[int]
+WordArray: TypeAlias = list[WordObject]

datamuse-0.3.0/datamuse/datamuse.py ADDED Viewed

@@ -0,0 +1,199 @@
+import functools
+from types import MappingProxyType
+from typing import Any, final
+import certifi
+import urllib3
+from datamuse.annotations import (
+    MetadataFlag,
+    RelatedWordCode,
+    Word,
+    WordArray,
+    WordObject,
+    _lookup_metadata_flag,
+    _lookup_related_code,
+)
+@final
+class Datamuse:
+    """
+    The [Datamuse API](https://www.datamuse.com/api/) is a word-finding query engine for developers.
+    Use it in your apps to find words that match a given set of constraints and that are likely in a given context.
+    Specify a wide variety of constraints on meaning, spelling, sound, and vocabulary in your queries, in any combination.
+    """
+    __API_URL = "api.datamuse.com"
+    __slots__ = ("__pool", "__metadata_flags", "__metadata", "_metadata")
+    def __init__(self) -> None:
+        self.__pool = urllib3.HTTPSConnectionPool(
+            host=self.__API_URL,
+            port=443,
+            cert_reqs="CERT_REQUIRED",
+            ca_certs=certifi.where(),
+        )
+        self.__metadata_flags: dict[str, str] = {}
+        self.__metadata: dict[str, dict[str, Any]] = {}
+        self._metadata = MappingProxyType(self.__metadata)
+    @property
+    def metadata(self):
+        """
+        A mapping of a word to its metadata.
+        """
+        return self._metadata
+    def _get_words(self, **kwds: Word):
+        parsed = self.__get("/words", **kwds, **self.__metadata_flags)
+        self.__metadata_flags.clear()
+        return parsed
+    def _get_suggestions(self, **kwds: Word):
+        parsed = self.__get("/sug", **kwds, **self.__metadata_flags)
+        self.__metadata_flags.clear()
+        return parsed
+    @functools.lru_cache
+    def __get(self, url: str, **kwds: Word) -> list[Word]:
+        json_response = self.__pool.request(method="GET", url=url, fields=kwds).json()
+        words = self._make_metadata(json_response)
+        return words or [obj["word"] for obj in json_response]
+    def _make_metadata(self, json_response: WordArray) -> list[Word]:
+        """
+        Builds a `metadata` dict by parsing the JSON Reponse, returing a flattened list of string.
+        The `metadata` is updated per parsing.
+        The keys may not be same across parsing since it depends on the
+        metdata flags with which the API call was made.
+        :param json_response: The json response from the datamuse api
+        :type json_response: WordArray
+        :return: A flattened list of string
+        :rtype: list[Word]
+        """
+        words = []
+        if self.__metadata_flags:
+            flags = self.__metadata_flags["md"]
+            for obj in json_response:
+                word = obj["word"]
+                words.append(word)
+                if word not in self.__metadata:
+                    self.__metadata[word] = {}
+                for f in flags:
+                    match f:
+                        case "d":
+                            self._make_definitions(obj)
+                        case "p":
+                            self._make_parts_of_speech(obj)
+                        case "s":
+                            self._make_syllable_count(obj)
+                        case "_":  # pragma: no cover
+                            # TODO: support remaining documenetd metadata flags
+                            continue
+        return words
+    def _make_definitions(self, obj: WordObject, /):
+        # TODO: what is the `defHeadWord` in api response?
+        self.__metadata[obj["word"]].update(
+            definitions=list(map(str.expandtabs, obj.get("defs", [])))
+        )
+    def _make_syllable_count(self, obj: WordObject, /):
+        self.__metadata[obj["word"]].update(syllable_count=obj.get("numSyllables", 0))
+    def _make_parts_of_speech(self, obj: WordObject, /):
+        self.__metadata[obj["word"]].update(parts_of_speech=[])
+        for t in obj.get("tags", []):
+            match t:
+                case "n":
+                    self.__metadata[obj["word"]]["parts_of_speech"].append("noun")
+                case "v":
+                    self.__metadata[obj["word"]]["parts_of_speech"].append("verb")
+                case "adj":
+                    self.__metadata[obj["word"]]["parts_of_speech"].append("adjective")
+                case "adv":
+                    self.__metadata[obj["word"]]["parts_of_speech"].append("adverb")
+                case _:
+                    pass
+    def synonyms(self, ml: Word):
+        """
+        words with a meaning similar to `ml`
+        :param ml: means like
+        """
+        return self._get_words(ml=ml)
+    def associations(self, ml: Word, start: Word = "*", end: Word = "*"):
+        """
+        words related to `ml`
+        :param ml: means like
+        :param start: start with
+        :param end: end in
+        """
+        return self._get_words(ml=ml, sp=start + end)
+    def homophones(self, sl: Word):
+        """
+        words that sound like `sl`
+        :param sl: sounds like
+        """
+        return self._get_words(sl=sl)
+    def pattern(self, start: Word, end: Word, letters: int):
+        """
+        words that start with `start`, end in `end`, and have `letters` in between
+        :param start: start with
+        :param end: end in
+        :param letters: letters in between
+        """
+        return self._get_words(sp=f"{start[0]}{'?' * letters}{end[0]}")
+    def orthographic_neighbours(self, sp: Word):
+        """
+        words that are spelled similarly to `sp`
+        :param sp: spelled like
+        """
+        return self._get_words(sp=sp)
+    def related(self, word: Word, rel: RelatedWordCode):
+        """
+        words that are related by `rel`
+        :param word: the word
+        :param rel: related word
+        """
+        return self._get_words(**{f"rel_{_lookup_related_code[rel]}": word})  # pyright: ignore[reportArgumentType]
+    def suggestions(self, s: Word):
+        """
+        sugesstions from prefix hint string `s`
+        :param s: prefix hint string
+        """
+        return self._get_suggestions(s=s)
+    def with_metadata(self, *md: MetadataFlag):
+        """
+        Include extra lexical knowledge for a `Word`.
+        Accessible through the `metadata` property.
+        :param md: the metadata
+        """
+        self.__metadata_flags.update(
+            md="".join({_lookup_metadata_flag[meta] for meta in md})
+        )
+        return self

{datamuse-0.2.0 → datamuse-0.3.0}/datamuse.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: datamuse
-Version: 0.2.0
+Version: 0.3.0
 Summary: datamuse is a simple wrapper around the datamuse api https://www.datamuse.com/api/
 Author-email: Bivas Kumar <thetrotfreak@yahoo.com>
 License-Expression: MIT

{datamuse-0.2.0 → datamuse-0.3.0}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [project]
 name = "datamuse"
-version = "0.2.0"
+version = "0.3.0"
 authors = [
     { name="Bivas Kumar", email="thetrotfreak@yahoo.com" },
 ]

{datamuse-0.2.0 → datamuse-0.3.0}/tests/test_datamuse.py RENAMED Viewed

@@ -1,6 +1,6 @@
 import pytest
-from datamuse.annotations import _lookup_related_code
+from datamuse.annotations import _lookup_metadata_flag, _lookup_related_code
 class TestDatamuse:
@@ -83,3 +83,23 @@ class TestDatamuse:
         )
         related = mock.related(word_mock, parameter)
         assert word_mock in related
+    @pytest.mark.parametrize("flag", _lookup_metadata_flag)
+    def test_with_metadata_words(self, datamuse_mock, word_mock, flag):
+        mock = datamuse_mock(
+            method="GET",
+            url="/words",
+            response=[
+                {
+                    "word": word_mock,
+                    "tags": ["u", "n", "v", "adj", "adv"],
+                    "defs": [word_mock],
+                    "numSyllables": len(word_mock),
+                }
+            ],
+            match_query={"ml": word_mock, "md": f"{_lookup_metadata_flag[flag]}"},
+        )
+        synonyms = mock.with_metadata(flag).synonyms(word_mock)
+        assert word_mock in synonyms
+        assert word_mock in mock.metadata
+        assert flag in mock.metadata[word_mock]

datamuse-0.2.0/datamuse/annotations.py DELETED Viewed

@@ -1,40 +0,0 @@
-from types import MappingProxyType
-from typing import Literal, LiteralString, TypeAlias
-Word: TypeAlias = LiteralString
-RelatedWordCode = Literal[
-    "nouns_adjective",
-    "adjectives_noun",
-    "synonyms",
-    "triggers",
-    "antonyms",
-    "hypernyms",
-    "hyponyms",
-    "holonyms",
-    "meronyms",
-    "frequent_followers",
-    "frequent_predecessors",
-    "homophones",
-    "consonant",
-]
-_lookup_related_code = MappingProxyType(
-    {
-        "nouns_adjective": "jja",
-        "adjectives_noun": "jjb",
-        "synonyms": "syn",
-        "triggers": "trg",
-        "antonyms": "ant",
-        "hypernyms": "spc",
-        "hyponyms": "gen",
-        "holonyms": "com",
-        "meronyms": "par",
-        "frequent_followers": "bga",
-        "frequent_predecessors": "bgb",
-        "homophones": "hom",
-        "consonant": "cns",
-    }
-)

datamuse-0.2.0/datamuse/datamuse.py DELETED Viewed

@@ -1,99 +0,0 @@
-import functools
-from typing import final
-import certifi
-import urllib3
-from datamuse.annotations import RelatedWordCode, Word, _lookup_related_code
-@final
-class Datamuse:
-    """
-    The [Datamuse](https://www.datamuse.com/) [API](https://www.datamuse.com/api/) is a word-finding query engine for developers.
-    You can use it in your apps to find words that match a given set of constraints and that are likely in a given context.
-    You can specify a wide variety of constraints on meaning, spelling, sound, and vocabulary in your queries, in any combination.
-    """
-    __API_URL = "api.datamuse.com"
-    __slots__ = ("__pool",)
-    def __init__(self) -> None:
-        self.__pool = urllib3.HTTPSConnectionPool(
-            host=self.__API_URL,
-            port=443,
-            cert_reqs="CERT_REQUIRED",
-            ca_certs=certifi.where(),
-        )
-    @functools.lru_cache
-    def __get_words(self, **kwds: Word | RelatedWordCode) -> list[Word]:
-        response = self.__pool.request(method="GET", url="/words", fields=kwds)
-        return [word["word"] for word in response.json()]
-    @functools.lru_cache
-    def __get_suggestions(self, **kwds: Word | RelatedWordCode) -> list[Word]:
-        response = self.__pool.request(method="GET", url="/sug", fields=kwds)
-        return [word["word"] for word in response.json()]
-    def synonyms(self, ml: Word):
-        """
-        words with a meaning similar to `ml`
-        :param ml: means like
-        """
-        return self.__get_words(ml=ml)
-    def associations(self, ml: Word, start: Word = "*", end: Word = "*"):
-        """
-        words related to `ml`
-        :param ml: means like
-        :param start: start with
-        :param end: end in
-        """
-        return self.__get_words(ml=ml, sp=start + end)
-    def homophones(self, sl: Word):
-        """
-        words that sound like `sl`
-        :param sl: sounds like
-        """
-        return self.__get_words(sl=sl)
-    def pattern(self, start: Word, end: Word, letters: int):
-        """
-        words that start with `start`, end in `end`, and have `letters` in between
-        :param start: start with
-        :param end: end in
-        :param letters: letters in between
-        """
-        return self.__get_words(sp=f"{start[0]}{'?' * letters}{end[0]}")
-    def orthographic_neighbours(self, sp: Word):
-        """
-        words that are spelled similarly to `sp`
-        :param sp: spelled like
-        """
-        return self.__get_words(sp=sp)
-    def related(self, word: Word, rel: RelatedWordCode):
-        """
-        words that are related by `rel`
-        :param word: the word
-        :param rel: related word
-        """
-        return self.__get_words(**{f"rel_{_lookup_related_code[rel]}": word})
-    def suggestions(self, s: Word):
-        """
-        sugesstions from prefix hint string `s`
-        :param s: prefix hint string
-        """
-        return self.__get_suggestions(s=s)