PyPI - dhisana - Versions diffs - 0.0.1.dev85__py3-none-any.whl → 0.0.1.dev236__py3-none-any.whl - Mend

dhisana-0.0.1.dev85-py3-none-any.whl → dhisana-0.0.1.dev236-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (70)

dhisana/schemas/common.py +33 -0
dhisana/schemas/sales.py +224 -23
dhisana/utils/add_mapping.py +72 -63
dhisana/utils/apollo_tools.py +739 -109
dhisana/utils/built_with_api_tools.py +4 -2
dhisana/utils/cache_output_tools.py +23 -23
dhisana/utils/check_email_validity_tools.py +456 -458
dhisana/utils/check_for_intent_signal.py +1 -2
dhisana/utils/check_linkedin_url_validity.py +34 -8
dhisana/utils/clay_tools.py +3 -2
dhisana/utils/clean_properties.py +3 -1
dhisana/utils/compose_salesnav_query.py +0 -1
dhisana/utils/compose_search_query.py +7 -3
dhisana/utils/composite_tools.py +0 -1
dhisana/utils/dataframe_tools.py +2 -2
dhisana/utils/email_body_utils.py +72 -0
dhisana/utils/email_provider.py +375 -0
dhisana/utils/enrich_lead_information.py +585 -85
dhisana/utils/fetch_openai_config.py +129 -0
dhisana/utils/field_validators.py +1 -1
dhisana/utils/g2_tools.py +0 -1
dhisana/utils/generate_content.py +0 -1
dhisana/utils/generate_email.py +69 -16
dhisana/utils/generate_email_response.py +298 -41
dhisana/utils/generate_flow.py +0 -1
dhisana/utils/generate_linkedin_connect_message.py +19 -6
dhisana/utils/generate_linkedin_response_message.py +156 -65
dhisana/utils/generate_structured_output_internal.py +351 -131
dhisana/utils/google_custom_search.py +150 -44
dhisana/utils/google_oauth_tools.py +721 -0
dhisana/utils/google_workspace_tools.py +391 -25
dhisana/utils/hubspot_clearbit.py +3 -1
dhisana/utils/hubspot_crm_tools.py +771 -167
dhisana/utils/instantly_tools.py +3 -1
dhisana/utils/lusha_tools.py +10 -7
dhisana/utils/mailgun_tools.py +150 -0
dhisana/utils/microsoft365_tools.py +447 -0
dhisana/utils/openai_assistant_and_file_utils.py +121 -177
dhisana/utils/openai_helpers.py +19 -16
dhisana/utils/parse_linkedin_messages_txt.py +2 -3
dhisana/utils/profile.py +37 -0
dhisana/utils/proxy_curl_tools.py +507 -206
dhisana/utils/proxycurl_search_leads.py +426 -0
dhisana/utils/research_lead.py +121 -68
dhisana/utils/sales_navigator_crawler.py +1 -6
dhisana/utils/salesforce_crm_tools.py +323 -50
dhisana/utils/search_router.py +131 -0
dhisana/utils/search_router_jobs.py +51 -0
dhisana/utils/sendgrid_tools.py +126 -91
dhisana/utils/serarch_router_local_business.py +75 -0
dhisana/utils/serpapi_additional_tools.py +290 -0
dhisana/utils/serpapi_google_jobs.py +117 -0
dhisana/utils/serpapi_google_search.py +188 -0
dhisana/utils/serpapi_local_business_search.py +129 -0
dhisana/utils/serpapi_search_tools.py +363 -432
dhisana/utils/serperdev_google_jobs.py +125 -0
dhisana/utils/serperdev_local_business.py +154 -0
dhisana/utils/serperdev_search.py +233 -0
dhisana/utils/smtp_email_tools.py +576 -0
dhisana/utils/test_connect.py +1765 -92
dhisana/utils/trasform_json.py +95 -16
dhisana/utils/web_download_parse_tools.py +0 -1
dhisana/utils/zoominfo_tools.py +2 -3
dhisana/workflow/test.py +1 -1
{dhisana-0.0.1.dev85.dist-info → dhisana-0.0.1.dev236.dist-info}/METADATA +5 -2
dhisana-0.0.1.dev236.dist-info/RECORD +100 -0
{dhisana-0.0.1.dev85.dist-info → dhisana-0.0.1.dev236.dist-info}/WHEEL +1 -1
dhisana-0.0.1.dev85.dist-info/RECORD +0 -81
{dhisana-0.0.1.dev85.dist-info → dhisana-0.0.1.dev236.dist-info}/entry_points.txt +0 -0
{dhisana-0.0.1.dev85.dist-info → dhisana-0.0.1.dev236.dist-info}/top_level.txt +0 -0

dhisana/utils/check_email_validity_tools.py CHANGED

@@ -1,407 +1,481 @@
+"""
+Email enrichment & validation module
+Adds Findymail support on top of existing ZeroBounce, Hunter and Apollo flows.
+Providers supported
+-------------------
+* Findymail   – email finder (`/search/name`) & verifier (`/verify`)
+* Hunter      – email finder (`/email-finder`) & verifier (`/email-verifier`)
+* ZeroBounce  – guess format (`/guessformat`) & verifier (`/validate`)
+* Apollo      – enrichment fallback (re‑checked with ZeroBounce/Hunter)
+Priority order
+--------------
+Validation:  Findymail → Hunter → ZeroBounce
+Guess/find:  Findymail → Hunter → ZeroBounce → Apollo
+"""
+from __future__ import annotations
 import os
 import json
 import logging
+import re
 from typing import Dict, List, Optional, Any
 import aiohttp
+# ────────────────────────────────────────────────────────────────────────────
+# Dhisana utility imports
+# ────────────────────────────────────────────────────────────────────────────
 from dhisana.schemas.sales import HubSpotLeadInformation
 from dhisana.utils.field_validators import validate_and_clean_email
-from dhisana.utils.hubspot_crm_tools import lookup_contact_by_name_and_domain
-logger = logging.getLogger(__name__)
 from dhisana.utils.apollo_tools import enrich_user_info_with_apollo
 from dhisana.utils.assistant_tool_tag import assistant_tool
 from dhisana.utils.cache_output_tools import cache_output, retrieve_output
-# --------------------------------------------------------------------------------
-# 1. Access Token Helpers
-# --------------------------------------------------------------------------------
+logger = logging.getLogger(__name__)
-def get_zero_bounce_access_token(tool_config: Optional[List[Dict]] = None) -> str:
+# ===========================================================================
+# 0.  FINDYMAIL HELPERS
+# ===========================================================================
+FINDYMAIL_BASE_URL = "https://app.findymail.com/api"
+def get_findymail_access_token(tool_config: Optional[List[Dict]] = None) -> str:
     """
-    Retrieves the ZeroBounce access token from the provided tool configuration or environment.
+    Retrieve the Findymail API key either from tool_config or environment.
+    Tool‑config JSON shape expected:
+        {
+          "name": "findymail",
+          "configuration": [
+              {"name": "apiKey", "value": "<API_KEY>"}
+          ]
+        }
     """
     if tool_config:
-        zerobounce_config = next(
-            (item for item in tool_config if item.get("name") == "zerobounce"), None
+        fm_cfg = next(
+            (item for item in tool_config if item.get("name") == "findymail"), None
         )
-        if zerobounce_config:
-            config_map = {
-                c["name"]: c["value"]
-                for c in zerobounce_config.get("configuration", [])
-                if c
+        if fm_cfg:
+            cfg_map = {
+                c["name"]: c["value"] for c in fm_cfg.get("configuration", []) if c
             }
-            ZERO_BOUNCE_API_KEY = config_map.get("apiKey")
+            api_key = cfg_map.get("apiKey")
         else:
-            logger.warning("ZeroBounce config not provided or missing 'apiKey'.")
-            ZERO_BOUNCE_API_KEY = None
+            api_key = None
     else:
-        logger.warning("ZeroBounce config not provided or missing 'apiKey'.")
-        ZERO_BOUNCE_API_KEY = None
+        api_key = None
+    api_key = api_key or os.getenv("FINDYMAIL_API_KEY")
+    if not api_key:
+        logger.warning(
+            "Findymail integration is not configured. Please configure the connection to Findymail in Integrations."
+        )
+        return ""
+    return api_key
-    ZERO_BOUNCE_API_KEY = ZERO_BOUNCE_API_KEY or os.getenv("ZERO_BOUNCE_API_KEY")
-    if not ZERO_BOUNCE_API_KEY:
-        logger.warning("ZERO_BOUNCE_API_KEY not found in config or env.")
-        return ""  # Return empty so we don't break
-    return ZERO_BOUNCE_API_KEY
+# ===========================================================================
+# 1.  ACCESS‑TOKEN HELPERS FOR EXISTING PROVIDERS
+# ===========================================================================
+def get_zero_bounce_access_token(tool_config: Optional[List[Dict]] = None) -> str:
+    """Retrieve ZeroBounce key from config/env."""
+    if tool_config:
+        zb_cfg = next(
+            (item for item in tool_config if item.get("name") == "zerobounce"), None
+        )
+        if zb_cfg:
+            cfg_map = {
+                c["name"]: c["value"] for c in zb_cfg.get("configuration", []) if c
+            }
+            api_key = cfg_map.get("apiKey")
+        else:
+            api_key = None
+    else:
+        api_key = None
+    api_key = api_key or os.getenv("ZERO_BOUNCE_API_KEY")
+    if not api_key:
+        logger.warning(
+            "ZeroBounce integration is not configured. Please configure the connection to ZeroBounce in Integrations."
+        )
+        return ""
+    return api_key
 def get_hunter_access_token(tool_config: Optional[List[Dict]] = None) -> str:
-    """
-    Retrieves the Hunter.io access token from the provided tool configuration or environment.
-    """
+    """Retrieve Hunter.io key from config/env."""
     if tool_config:
-        hunter_config = next(
+        h_cfg = next(
             (item for item in tool_config if item.get("name") == "hunter"), None
         )
-        if hunter_config:
-            config_map = {
-                c["name"]: c["value"]
-                for c in hunter_config.get("configuration", [])
-                if c
+        if h_cfg:
+            cfg_map = {
+                c["name"]: c["value"] for c in h_cfg.get("configuration", []) if c
             }
-            HUNTER_API_KEY = config_map.get("apiKey")
+            api_key = cfg_map.get("apiKey")
         else:
-            logger.warning("Hunter config not provided or missing 'apiKey'.")
-            HUNTER_API_KEY = None
+            api_key = None
     else:
-        logger.warning("Hunter config not provided or missing 'apiKey'.")
-        HUNTER_API_KEY = None
+        api_key = None
-    HUNTER_API_KEY = HUNTER_API_KEY or os.getenv("HUNTER_API_KEY")
-    if not HUNTER_API_KEY:
-        logger.warning("HUNTER_API_KEY not found in config or env.")
-        return ""  # Return empty so we don't break
+    api_key = api_key or os.getenv("HUNTER_API_KEY")
+    if not api_key:
+        logger.warning(
+            "Hunter integration is not configured. Please configure the connection to Hunter in Integrations."
+        )
+        return ""
+    return api_key
-    return HUNTER_API_KEY
+# ===========================================================================
+# 2.  VALIDATION FUNCTIONS
+# ===========================================================================
-# --------------------------------------------------------------------------------
-# 2. Provider-Specific Validation Functions
-# --------------------------------------------------------------------------------
-def _map_zerobounce_status_to_confidence(status: str) -> str:
+@assistant_tool
+async def check_email_validity_with_findymail(
+    email_id: str,
+    tool_config: Optional[List[Dict]] = None,
+) -> Dict[str, Any]:
     """
-    Map ZeroBounce's status string to "high", "medium", or "low" confidence.
+    Validate deliverability using Findymail `/verify` endpoint.
+    Returns
+    -------
+    {
+        "email": str,
+        "confidence": "high" | "low",
+        "is_valid": bool
+    }
     """
+    logger.info("Entering check_email_validity_with_findymail: %s", email_id)
+    if not email_id or not re.fullmatch(r"[^@]+@[^@]+\.[^@]+", email_id):
+        return {"email": email_id, "confidence": "low", "is_valid": False}
+    cache_key = f"findymail:{email_id}"
+    cached = retrieve_output("findymail_validate", cache_key)
+    if cached:
+        return json.loads(cached[0])
+    api_key = get_findymail_access_token(tool_config)
+    if not api_key:
+        return {"email": email_id, "confidence": "low", "is_valid": False}
+    url = f"{FINDYMAIL_BASE_URL}/verify"
+    headers = {"Authorization": f"Bearer {api_key}", "Content-Type": "application/json"}
+    try:
+        async with aiohttp.ClientSession() as session:
+            async with session.post(url, json={"email": email_id}, headers=headers) as r:
+                if r.status != 200:
+                    logger.warning("[Findymail] verify non‑200: %s", r.status)
+                    result = {"email": email_id, "confidence": "low", "is_valid": False}
+                else:
+                    data = await r.json()
+                    verified = bool(data.get("verified") or data.get("result") == "verified")
+                    result = {
+                        "email": email_id,
+                        "confidence": "high" if verified else "low",
+                        "is_valid": verified,
+                    }
+    except Exception as ex:
+        logger.exception("[Findymail] verify exception: %s", ex)
+        result = {"email": email_id, "confidence": "low", "is_valid": False}
+    cache_output("findymail_validate", cache_key, [json.dumps(result)])
+    return result
+# ───── ZeroBounce mapping/validation ───────────────────────────────────────
+def _map_zerobounce_status_to_confidence(status: str) -> str:
     status = status.lower()
     if status == "valid":
         return "high"
-    elif status in ["catch-all", "unknown"]:
+    if status in ("catch-all", "unknown"):
         return "medium"
-    elif status in ["spamtrap", "invalid"]:
-        return "low"
     return "low"
 @assistant_tool
 async def check_email_validity_with_zero_bounce(
     email_id: str,
-    tool_config: Optional[List[Dict]] = None
+    tool_config: Optional[List[Dict]] = None,
 ) -> Dict[str, Any]:
-    """
-    Validate a single email address using the ZeroBounce API, with caching.
-    Returns: {
-      "email": str,
-      "confidence": "high"|"medium"|"low",
-      "is_valid": bool
-    }
-    """
-    logger.info("Entering check_email_validity_with_zero_bounce for email_id: %s", email_id)
-    import re
+    logger.info("Entering check_email_validity_with_zero_bounce: %s", email_id)
     if not email_id or not re.fullmatch(r"[^@]+@[^@]+\.[^@]+", email_id):
-        return {
-            "email": email_id,
-            "confidence": "low",
-            "is_valid": False
-        }
+        return {"email": email_id, "confidence": "low", "is_valid": False}
-    cache_key = f"{email_id}"
-    cached_response = retrieve_output("zerobounce_validate", cache_key)
-    if cached_response is not None:
-        logger.info("Cache hit for ZeroBounce validate.")
-        if not cached_response:
-            return {
-                "email": email_id,
-                "confidence": "low",
-                "is_valid": False
-            }
-        return json.loads(cached_response[0])
-    # Get API key
-    ZERO_BOUNCE_API_KEY = get_zero_bounce_access_token(tool_config)
-    if not ZERO_BOUNCE_API_KEY:
-        logger.warning("No ZeroBounce API key available. Returning low confidence.")
-        return {
-            "email": email_id,
-            "confidence": "low",
-            "is_valid": False
-        }
+    cache_key = f"zerobounce:{email_id}"
+    cached = retrieve_output("zerobounce_validate", cache_key)
+    if cached:
+        return json.loads(cached[0])
-    url = (
-        "https://api.zerobounce.net/v2/validate"
-        f"?api_key={ZERO_BOUNCE_API_KEY}&email={email_id}"
-    )
+    api_key = get_zero_bounce_access_token(tool_config)
+    if not api_key:
+        return {"email": email_id, "confidence": "low", "is_valid": False}
+    url = f"https://api.zerobounce.net/v2/validate?api_key={api_key}&email={email_id}"
     try:
         async with aiohttp.ClientSession() as session:
-            async with session.get(url) as response:
-                if response.status != 200:
-                    content = await safe_read_json_or_text(response)
-                    logger.warning(
-                        f"[ZeroBounce] Non-200 status: {response.status} => {content}"
-                    )
-                    # Return fallback instead of raising
-                    final_response = {
+            async with session.get(url) as r:
+                if r.status != 200:
+                    logger.warning("[ZeroBounce] non‑200: %s", r.status)
+                    result = {"email": email_id, "confidence": "low", "is_valid": False}
+                else:
+                    data = await r.json()
+                    conf = _map_zerobounce_status_to_confidence(data.get("status", ""))
+                    result = {
                         "email": email_id,
-                        "confidence": "low",
-                        "is_valid": False
+                        "confidence": conf,
+                        "is_valid": conf == "high",
                     }
-                    cache_output("zerobounce_validate", cache_key, [json.dumps(final_response)])
-                    return final_response
-                result = await response.json()
     except Exception as ex:
-        logger.warning(f"[ZeroBounce] Exception occurred => {ex}")
-        return {
-            "email": email_id,
-            "confidence": "low",
-            "is_valid": False
-        }
+        logger.exception("[ZeroBounce] validate exception: %s", ex)
+        result = {"email": email_id, "confidence": "low", "is_valid": False}
-    zb_status = result.get("status", "").lower()  # e.g. "valid", "invalid"
-    confidence = _map_zerobounce_status_to_confidence(zb_status)
-    is_valid = (confidence == "high")
+    cache_output("zerobounce_validate", cache_key, [json.dumps(result)])
+    return result
-    final_response = {
-        "email": email_id,
-        "confidence": confidence,
-        "is_valid": is_valid
-    }
-    cache_output("zerobounce_validate", cache_key, [json.dumps(final_response)])
-    logger.info("Exiting check_email_validity_with_zero_bounce.")
-    return final_response
+# ───── Hunter mapping/validation ───────────────────────────────────────────
-def _map_hunter_status_to_confidence(hunter_result: str) -> str:
-    """
-    Map Hunter's email verifier result to "high", "medium", or "low" confidence.
-    Possible results: deliverable, undeliverable, risky, unknown, accept_all.
-    """
-    val = hunter_result.lower()
-    if val == "deliverable":
+def _map_hunter_status_to_confidence(status: str) -> str:
+    status = status.lower()
+    if status == "deliverable":
         return "high"
-    elif val in ["risky", "unknown", "accept_all"]:
+    if status in ("unknown", "accept_all"):
         return "medium"
-    elif val == "undeliverable":
-        return "low"
     return "low"
 @assistant_tool
 async def check_email_validity_with_hunter(
     email_id: str,
-    tool_config: Optional[List[Dict]] = None
+    tool_config: Optional[List[Dict]] = None,
 ) -> Dict[str, Any]:
-    """
-    Validate a single email address using Hunter.io's email verification API.
-    Returns: {
-      "email": str,
-      "confidence": "high"|"medium"|"low",
-      "is_valid": bool
-    }
-    """
-    logger.info("Entering check_email_validity_with_hunter for email_id: %s", email_id)
-    import re
+    logger.info("Entering check_email_validity_with_hunter: %s", email_id)
     if not email_id or not re.fullmatch(r"[^@]+@[^@]+\.[^@]+", email_id):
-        return {
-            "email": email_id,
-            "confidence": "low",
-            "is_valid": False
-        }
+        return {"email": email_id, "confidence": "low", "is_valid": False}
-    HUNTER_API_KEY = get_hunter_access_token(tool_config)
-    if not HUNTER_API_KEY:
-        logger.warning("No Hunter API key available. Returning low confidence.")
-        return {
-            "email": email_id,
-            "confidence": "low",
-            "is_valid": False
-        }
+    cache_key = f"hunter:{email_id}"
+    cached = retrieve_output("hunter_validate", cache_key)
+    if cached:
+        return json.loads(cached[0])
-    url = (
-        "https://api.hunter.io/v2/email-verifier"
-        f"?email={email_id}&api_key={HUNTER_API_KEY}"
-    )
+    api_key = get_hunter_access_token(tool_config)
+    if not api_key:
+        return {"email": email_id, "confidence": "low", "is_valid": False}
+    url = f"https://api.hunter.io/v2/email-verifier?email={email_id}&api_key={api_key}"
     try:
         async with aiohttp.ClientSession() as session:
-            async with session.get(url) as response:
-                if response.status != 200:
-                    content = await safe_read_json_or_text(response)
-                    logger.warning(f"[Hunter] Non-200 status: {response.status} => {content}")
-                    return {
+            async with session.get(url) as r:
+                if r.status != 200:
+                    logger.warning("[Hunter] non‑200: %s", r.status)
+                    result = {"email": email_id, "confidence": "low", "is_valid": False}
+                else:
+                    data = await r.json()
+                    res = data.get("data", {}).get("result", "")
+                    conf = _map_hunter_status_to_confidence(res)
+                    result = {
                         "email": email_id,
-                        "confidence": "low",
-                        "is_valid": False
+                        "confidence": conf,
+                        "is_valid": conf == "high",
                     }
+    except Exception as ex:
+        logger.exception("[Hunter] validate exception: %s", ex)
+        result = {"email": email_id, "confidence": "low", "is_valid": False}
+    cache_output("hunter_validate", cache_key, [json.dumps(result)])
+    return result
+# ===========================================================================
+# 3.  GUESS / FIND FUNCTIONS
+# ===========================================================================
+@assistant_tool
+async def guess_email_with_findymail(
+    first_name: str,
+    last_name: str,
+    domain: str,
+    user_linkedin_url: Optional[str] = None,
+    middle_name: Optional[str] = None,
+    tool_config: Optional[List[Dict]] = None,
+) -> Dict[str, Any]:
+    """Use Findymail to guess an email.
+    If ``user_linkedin_url`` is provided, the function queries ``/search/linkedin``.
+    Otherwise it falls back to ``/search/name`` with ``first_name``/``last_name``
+    and ``domain``. Only verified emails are returned and therefore considered
+    high confidence.
+    """
+    logger.info("Entering guess_email_with_findymail")
+    if user_linkedin_url:
+        cache_key = f"findymail:{user_linkedin_url}"
+    else:
+        if not first_name or not last_name or not domain:
+            return {"email": "", "email_confidence": "low"}
+        cache_key = f"findymail:{first_name}_{last_name}_{domain}"
+    api_key = get_findymail_access_token(tool_config)
+    if not api_key:
+        return {"email": "", "email_confidence": "low"}
+    cached = retrieve_output("findymail_guess", cache_key)
+    if cached:
+        return json.loads(cached[0])
+    if user_linkedin_url:
+        url = f"{FINDYMAIL_BASE_URL}/search/linkedin"
+        payload = {"linkedin_url": user_linkedin_url, "webhook_url": None}
+    else:
+        url = f"{FINDYMAIL_BASE_URL}/search/name"
+        full_name = " ".join(filter(None, [first_name, middle_name, last_name]))
+        payload = {"name": full_name, "domain": domain}
+    headers = {"Authorization": f"Bearer {api_key}", "Content-Type": "application/json"}
-                result = await response.json()
+    try:
+        async with aiohttp.ClientSession() as session:
+            async with session.post(url, headers=headers, json=payload) as r:
+                if r.status != 200:
+                    logger.warning("[Findymail] search non‑200: %s", r.status)
+                    result = {"email": "", "email_confidence": "low"}
+                else:
+                    data = await r.json()
+                    contact = data.get("contact")
+                    found = contact.get("email", "") if contact else ""
+                    if found:
+                        result = {
+                            "email": found,
+                            "email_confidence": "high",
+                            "contact_info": json.dumps(contact) if contact else "",
+                        }
+                    else:
+                        result = {"email": "", "email_confidence": "low"}
     except Exception as ex:
-        logger.warning(f"[Hunter] Exception occurred => {ex}")
-        return {
-            "email": email_id,
-            "confidence": "low",
-            "is_valid": False
-        }
+        logger.exception("[Findymail] search exception: %s", ex)
+        result = {"email": "", "email_confidence": "low"}
-    data = result.get("data", {})
-    verifier_result = data.get("result", "")  # "deliverable", "undeliverable", etc.
-    confidence = _map_hunter_status_to_confidence(verifier_result)
-    is_valid = (confidence == "high")
+    cache_output("findymail_guess", cache_key, [json.dumps(result)])
+    return result
-    final_response = {
-        "email": email_id,
-        "confidence": confidence,
-        "is_valid": is_valid
-    }
-    logger.info("Exiting check_email_validity_with_hunter.")
-    return final_response
+# ───── ZeroBounce guess ────────────────────────────────────────────────────
-# --------------------------------------------------------------------------------
-# 3. Provider-Specific Guessing Functions
-# --------------------------------------------------------------------------------
 @assistant_tool
 async def guess_email_with_zero_bounce(
     first_name: str,
     last_name: str,
     domain: str,
-    user_linkedin_url: Optional[str] = None,  # Ignored by ZeroBounce
+    user_linkedin_url: Optional[str] = None,  # unused
     middle_name: Optional[str] = None,
-    tool_config: Optional[List[Dict]] = None
+    tool_config: Optional[List[Dict]] = None,
 ) -> Dict[str, Any]:
-    """
-    Attempt to guess the email using ZeroBounce's guessFormat endpoint, with caching.
-    We assume the API returns an "email" and an "email_confidence" field.
-    """
-    logger.info("Entering guess_email_with_zero_bounce.")
+    logger.info("Entering guess_email_with_zero_bounce")
     if not first_name or not last_name or not domain:
-        logger.error("Required parameters first_name, last_name, and domain must be provided.")
         return {"email": "", "email_confidence": "low"}
-    cache_key = f"{first_name}_{last_name}_{domain}_{middle_name or ''}"
-    cached_response = retrieve_output("zerobounce_guess", cache_key)
-    if cached_response is not None:
-        logger.info("Cache hit for ZeroBounce guess.")
-        return json.loads(cached_response[0]) if cached_response else {"email": "", "email_confidence": "low"}
-    ZERO_BOUNCE_API_KEY = get_zero_bounce_access_token(tool_config)
-    if not ZERO_BOUNCE_API_KEY:
-        logger.warning("No ZeroBounce API key available. Returning low confidence guess.")
+    api_key = get_zero_bounce_access_token(tool_config)
+    if not api_key:
         return {"email": "", "email_confidence": "low"}
-    base_url = "https://api.zerobounce.net/v2/guessformat"
-    query_params = (
-        f"?api_key={ZERO_BOUNCE_API_KEY}"
-        f"&domain={domain}"
-        f"&first_name={first_name}"
-        f"&middle_name={middle_name or ''}"
-        f"&last_name={last_name}"
+    cache_key = f"zerobounce:guess:{first_name}_{last_name}_{domain}_{middle_name or ''}"
+    cached = retrieve_output("zerobounce_guess", cache_key)
+    if cached:
+        return json.loads(cached[0])
+    url = (
+        "https://api.zerobounce.net/v2/guessformat"
+        f"?api_key={api_key}&domain={domain}"
+        f"&first_name={first_name}&middle_name={middle_name or ''}&last_name={last_name}"
     )
-    url = base_url + query_params
     try:
         async with aiohttp.ClientSession() as session:
-            async with session.get(url) as response:
-                if response.status != 200:
-                    content = await safe_read_json_or_text(response)
-                    logger.warning(f"[ZeroBounce] guessFormat error: {response.status} => {content}")
-                    return {"email": "", "email_confidence": "low"}
-                result = await response.json()
+            async with session.get(url) as r:
+                if r.status != 200:
+                    logger.warning("[ZeroBounce] guessformat non‑200: %s", r.status)
+                    result = {"email": "", "email_confidence": "low"}
+                else:
+                    data = await r.json()
+                    if "email_confidence" not in data:
+                        data["email_confidence"] = (
+                            "high" if data.get("email") else "low"
+                        )
+                    result = data
     except Exception as ex:
-        logger.warning(f"[ZeroBounce] Exception => {ex}")
-        return {"email": "", "email_confidence": "low"}
-    # If the API doesn't provide "email_confidence", you can supply a fallback:
-    if "email_confidence" not in result:
-        result["email_confidence"] = "medium" if result.get("email") else "low"
+        logger.exception("[ZeroBounce] guess exception: %s", ex)
+        result = {"email": "", "email_confidence": "low"}
     cache_output("zerobounce_guess", cache_key, [json.dumps(result)])
-    logger.info("Exiting guess_email_with_zero_bounce.")
     return result
+# ───── Hunter guess ────────────────────────────────────────────────────────
 @assistant_tool
 async def guess_email_with_hunter(
     first_name: str,
     last_name: str,
     domain: str,
-    user_linkedin_url: Optional[str] = None,  # Ignored by Hunter
+    user_linkedin_url: Optional[str] = None,  # unused
     middle_name: Optional[str] = None,
-    tool_config: Optional[List[Dict]] = None
+    tool_config: Optional[List[Dict]] = None,
 ) -> Dict[str, Any]:
-    """
-    Attempt to guess the email using Hunter.io's email-finder endpoint.
-    We'll interpret the "score" (0-100) from the response and map it to "email_confidence".
-    """
-    logger.info("Entering guess_email_with_hunter.")
+    logger.info("Entering guess_email_with_hunter")
     if not first_name or not last_name or not domain:
-        logger.error("Required parameters first_name, last_name, and domain must be provided.")
         return {"email": "", "email_confidence": "low"}
-    HUNTER_API_KEY = get_hunter_access_token(tool_config)
-    if not HUNTER_API_KEY:
-        logger.warning("No Hunter API key available. Returning low-confidence guess.")
+    api_key = get_hunter_access_token(tool_config)
+    if not api_key:
         return {"email": "", "email_confidence": "low"}
     url = (
         "https://api.hunter.io/v2/email-finder"
-        f"?domain={domain}"
-        f"&first_name={first_name}"
-        f"&last_name={last_name}"
-        f"&api_key={HUNTER_API_KEY}"
+        f"?domain={domain}&first_name={first_name}&last_name={last_name}"
+        f"&api_key={api_key}"
     )
-    # If needed, you could pass middle_name, e.g. "&middle_name={middle_name}"
     try:
         async with aiohttp.ClientSession() as session:
-            async with session.get(url) as response:
-                if response.status != 200:
-                    content = await safe_read_json_or_text(response)
-                    logger.warning(f"[Hunter] email-finder error: {response.status} => {content}")
-                    return {"email": "", "email_confidence": "low"}
-                result = await response.json()
+            async with session.get(url) as r:
+                if r.status != 200:
+                    logger.warning("[Hunter] email-finder non‑200: %s", r.status)
+                    result = {"email": "", "email_confidence": "low"}
+                else:
+                    data = await r.json()
+                    email = data.get("data", {}).get("email", "")
+                    score = float(data.get("data", {}).get("score", 0) or 0)
+                    if score >= 80:
+                        conf = "high"
+                    elif score >= 50:
+                        conf = "medium"
+                    else:
+                        conf = "low"
+                    result = {"email": email, "email_confidence": conf}
     except Exception as ex:
-        logger.warning(f"[Hunter] Exception => {ex}")
-        return {"email": "", "email_confidence": "low"}
+        logger.exception("[Hunter] guess exception: %s", ex)
+        result = {"email": "", "email_confidence": "low"}
-    data = result.get("data", {})
-    found_email = data.get("email", "")
+    return result
-    # Safely parse numeric score
-    raw_score = data.get("score")  # might be int, float, None, or not present
-    try:
-        score = float(raw_score) if raw_score is not None else 0.0
-    except (ValueError, TypeError):
-        score = 0.0
-    if score >= 80:
-        confidence = "high"
-    elif score >= 50:
-        confidence = "medium"
-    else:
-        confidence = "low"
-    output = {
-        "email": found_email,
-        "email_confidence": confidence
-    }
-    logger.info("Exiting guess_email_with_hunter.")
-    return output
+# ───── Apollo guess (fallback) ─────────────────────────────────────────────
 @assistant_tool
@@ -411,115 +485,87 @@ async def guess_email_with_apollo(
     domain: str,
     user_linkedin_url: Optional[str] = None,
     middle_name: Optional[str] = None,
-    tool_config: Optional[List[Dict]] = None
+    tool_config: Optional[List[Dict]] = None,
 ) -> Dict[str, Any]:
-    """
-    Attempt to guess/enrich an email using Apollo, then re-check with ZeroBounce
-    to ensure we have acceptable confidence.
-    """
-    logger.info("Entering guess_email_with_apollo.")
+    logger.info("Entering guess_email_with_apollo")
     if not first_name or not last_name or not domain:
-        logger.error("Required parameters first_name, last_name, and domain must be provided.")
         return {"email": "", "email_confidence": "low"}
-    # If Apollo config is absent, return low
-    apollo_config = next((item for item in tool_config or [] if item.get("name") == "apollo"), None)
-    if not apollo_config:
-        logger.warning("No Apollo config found; cannot enrich with Apollo.")
+    apollo_cfg = next(
+        (item for item in tool_config or [] if item.get("name") == "apollo"), None
+    )
+    if not apollo_cfg:
         return {"email": "", "email_confidence": "low"}
-    input_lead_info = {
+    input_lead = {
         "first_name": first_name,
         "last_name": last_name,
         "primary_domain_of_organization": domain,
-        "user_linkedin_url": user_linkedin_url or ""
+        "user_linkedin_url": user_linkedin_url or "",
     }
     try:
-        # Attempt to enrich
-        response = await enrich_user_info_with_apollo(input_lead_info, tool_config)
+        enriched = await enrich_user_info_with_apollo(input_lead, tool_config)
     except Exception as ex:
-        logger.warning(f"[Apollo] Exception => {ex}")
-        return {"email": "", "email_confidence": "low"}
+        logger.exception("[Apollo] enrich exception: %s", ex)
+        enriched = {}
-    apollo_email = response.get("email", "")
+    apollo_email = enriched.get("email", "")
     if not apollo_email:
-        # No email found
         return {"email": "", "email_confidence": "low"}
-    # Now re-check with ZeroBounce for final confidence
-    zb_result = await check_email_validity_with_zero_bounce(apollo_email, tool_config)
-    # If ZeroBounce says "high" or "medium" => we keep it, else "low"
-    zb_conf = zb_result.get("confidence", "low")
-    if zb_conf in ["high", "medium"]:
-        return {
-            "email": apollo_email,
-            "email_confidence": zb_conf
-        }
-    else:
-        return {
-            "email": apollo_email,
-            "email_confidence": "low"
-        }
+    # quick re‑check with Hunter
+    validation = await check_email_validity_with_hunter(apollo_email, tool_config)
+    conf = validation.get("confidence", "low")
+    return {"email": apollo_email, "email_confidence": conf}
+# ─── Provider map
 GUESS_EMAIL_TOOL_MAP = {
-    "zerobounce": guess_email_with_zero_bounce,
+    "findymail": guess_email_with_findymail,
     "hunter": guess_email_with_hunter,
+    "zerobounce": guess_email_with_zero_bounce,
     "apollo": guess_email_with_apollo,
 }
+# ===========================================================================
+# 4.  AGGREGATORS
+# ===========================================================================
-# --------------------------------------------------------------------------------
-# 4. Aggregators (High-Level Validation + Guess)
-# --------------------------------------------------------------------------------
 @assistant_tool
 async def check_email_validity(
     email_id: str,
-    tool_config: Optional[List[Dict]] = None
+    tool_config: Optional[List[Dict]] = None,
 ) -> Dict[str, Any]:
     """
-    Validate an email address by checking each provider in priority order:
-      1) ZeroBounce
-      2) Hunter
-    If a provider returns high confidence, we stop. Otherwise we continue.
+    Validate by provider priority:
+        1) Findymail  2) Hunter  3) ZeroBounce
     """
-    logger.info("Entering check_email_validity method.")
+    logger.info("Entering check_email_validity")
     if not tool_config:
-        logger.warning("No tool configuration found; returning low confidence.")
-        return {
-            "email": email_id,
-            "confidence": "low",
-            "is_valid": False
-        }
+        return {"email": email_id, "confidence": "low", "is_valid": False}
-    provider_names = [item.get("name") for item in tool_config if item.get("name")]
-    # No mention of Apollo for direct validation, so keep the same priority:
-    priority = ["zerobounce", "hunter"]
+    names = [c.get("name") for c in tool_config if c.get("name")]
+    priority = ["findymail", "hunter", "zerobounce"]
-    final_result = {
-        "email": email_id,
-        "confidence": "low",
-        "is_valid": False
-    }
+    result: Dict[str, Any] = {"email": email_id, "confidence": "low", "is_valid": False}
     for provider in priority:
-        if provider in provider_names:
-            if provider == "zerobounce":
-                result = await check_email_validity_with_zero_bounce(email_id, tool_config)
-            elif provider == "hunter":
-                result = await check_email_validity_with_hunter(email_id, tool_config)
-            else:
-                continue
+        if provider not in names:
+            continue
+        if provider == "findymail":
+            result = await check_email_validity_with_findymail(email_id, tool_config)
+        elif provider == "hunter":
+            result = await check_email_validity_with_hunter(email_id, tool_config)
+        else:
+            result = await check_email_validity_with_zero_bounce(email_id, tool_config)
-            final_result = result
-            # If "high" confidence, stop
-            if result["confidence"] == "high":
-                logger.info(f"{provider} gave high confidence. Stopping further checks.")
-                break
+        if result["confidence"] in ("high", "low"):
+            break
-    logger.info("Exiting check_email_validity method with result: %s", final_result)
-    return final_result
+    logger.info("Exiting check_email_validity with %s", result)
+    return result
 @assistant_tool
@@ -529,191 +575,143 @@ async def guess_email(
     domain: str,
     middle_name: Optional[str] = None,
     user_linkedin_url: Optional[str] = None,
-    tool_config: Optional[List[Dict]] = None
+    tool_config: Optional[List[Dict]] = None,
 ) -> Dict[str, Any]:
     """
-    Attempt to guess/enrich the email using provider(s) indicated in the tool_config,
-    in the priority order:
-      1) Hunter
-      2) ZeroBounce
-      3) Apollo  (last resort, re-check with ZeroBounce)
-    If the first guess is "high" confidence, we stop. Otherwise move on, etc.
+    Guess by provider priority:
+        1) Findymail  2) Hunter  3) ZeroBounce  4) Apollo
     """
-    logger.info("Entering guess_email method.")
+    logger.info("Entering guess_email")
     if not tool_config:
-        logger.warning("No tool configuration found; returning low-confidence guess.")
         return {"email": "", "email_confidence": "low"}
-    provider_names = [item.get("name") for item in tool_config if item.get("name")]
-    priority = ["zerobounce",  "apollo"]
-    final_result = {"email": "", "email_confidence": "low"}
+    names = [c.get("name") for c in tool_config if c.get("name")]
+    priority = ["findymail", "hunter", "zerobounce", "apollo"]
+    result: Dict[str, Any] = {"email": "", "email_confidence": "low"}
     for provider in priority:
-        if provider in provider_names:
-            guess_func = GUESS_EMAIL_TOOL_MAP[provider]
-            result = await guess_func(
-                first_name,
-                last_name,
-                domain,
-                user_linkedin_url,
-                middle_name,
-                tool_config
-            )
-            final_result = result
-            if result.get("email_confidence") == "high":
-                logger.info(f"{provider} gave high confidence on guess. Stopping further guesses.")
-                break
-            # If you want to stop at "medium" as well, you could:
-            # if result.get("email_confidence") in ["high", "medium"]:
-            #    break
-    logger.info("Exiting guess_email method with result: %s", final_result)
-    return final_result
-# --------------------------------------------------------------------------------
-# 5. Orchestrating everything in a single function
-# --------------------------------------------------------------------------------
+        if provider not in names:
+            continue
+        guess_fn = GUESS_EMAIL_TOOL_MAP[provider]
+        result = await guess_fn(
+            first_name,
+            last_name,
+            domain,
+            user_linkedin_url,
+            middle_name,
+            tool_config,
+        )
+        if result.get("email_confidence") == "high":
+            break
+    logger.info("Exiting guess_email with %s", result)
+    return result
+# ===========================================================================
+# 5.  PROCESS EMAIL PROPERTIES (unchanged except provider names usable)
+# ===========================================================================
 @assistant_tool
 async def process_email_properties(
     input_properties: Dict[str, Any],
-    tool_config: Optional[List[Dict]] = None
+    tool_config: Optional[List[Dict]] = None,
 ) -> Dict[str, Any]:
-    logger.info("Entering process_email_properties.")
+    """Central orchestrator used elsewhere in Dhisana."""
+    logger.info("Entering process_email_properties")
     first_name = input_properties.get("first_name", "")
     last_name = input_properties.get("last_name", "")
-    email = input_properties.get("email", "")
-    email = validate_and_clean_email(email)
+    email = validate_and_clean_email(input_properties.get("email", ""))
     additional_properties = input_properties.get("additional_properties", {})
     user_linkedin_url = input_properties.get("user_linkedin_url", "")
     domain = input_properties.get("primary_domain_of_organization", "")
     if email:
-        # Validate existing email
-        val_result = await check_email_validity(email, tool_config)
-        is_valid = val_result.get("is_valid", False)
-        confidence = val_result.get("confidence", "").lower()  # e.g. 'high', 'medium', 'low'
-        if is_valid and confidence == "high":
-            # Already good
+        val = await check_email_validity(email, tool_config)
+        if val["is_valid"] and val["confidence"] == "high":
             input_properties["email_validation_status"] = "valid"
         else:
-            # Invalid or medium/low -> mark invalid
             input_properties["email_validation_status"] = "invalid"
     else:
-        # No existing email -> must guess if domain is present
         if not domain:
-            logger.info("No primary domain found; cannot guess.")
-            additional_properties["guessed_email"] = ""
-            input_properties["email"] = ""
             input_properties["email_validation_status"] = "invalid"
+            input_properties["email"] = ""
         else:
-            # --- FIX STARTS HERE ---
+            # Try HubSpot lookup first (disabled by default)
             hubspot_lead_info = None
-            #TODO: test more and enable
             # hubspot_lead_info = await lookup_contact_by_name_and_domain(
-            #     first_name,
-            #     last_name,
-            #     domain,
-            #     tool_config=tool_config
+            #     first_name, last_name, domain, tool_config=tool_config
             # )
             if (
                 hubspot_lead_info
                 and isinstance(hubspot_lead_info, HubSpotLeadInformation)
                 and hubspot_lead_info.email
             ):
-                # We found a HubSpot email; validate it
                 hubspot_email = hubspot_lead_info.email
-                val_result = await check_email_validity(hubspot_email, tool_config)
-                is_valid = val_result.get("is_valid", False)
-                confidence = val_result.get("confidence", "").lower()
-                input_properties["email"] = hubspot_email
-                if is_valid and confidence == "high":
-                    # Accept HubSpot email
+                val = await check_email_validity(hubspot_email, tool_config)
+                if val["is_valid"] and val["confidence"] == "high":
                     input_properties["email"] = hubspot_email
                     input_properties["email_validation_status"] = "valid"
                 else:
-                    # HubSpot email is not high-confidence => guess
-                    guessed_result = await guess_email(
+                    g = await guess_email(
                         first_name,
                         last_name,
                         domain,
                         "",
                         user_linkedin_url,
-                        tool_config
+                        tool_config,
                     )
-                    if is_guess_usable(guessed_result):
-                        if guessed_result.get("email_confidence", "").lower() == "high":
-                            input_properties["email"] = guessed_result["email"]
+                    if is_guess_usable(g):
+                        input_properties["email"] = g["email"]
+                        if g["email_confidence"] == "high":
                             input_properties["email_validation_status"] = "valid"
                         else:
-                            additional_properties["guessed_email"] = guessed_result.get("email", "")
-                            input_properties["email"] = guessed_result.get("email", "")
                             input_properties["email_validation_status"] = "invalid"
-                    else:
-                        additional_properties["guessed_email"] = guessed_result.get("email", "")
-                        input_properties["email"] = guessed_result.get("email", "")
-                        input_properties["email_validation_status"] = "invalid"
+                            additional_properties["guessed_email"] = g["email"]
             else:
-                # No valid HubSpot match => guess
-                guessed_result = await guess_email(
+                g = await guess_email(
                     first_name,
                     last_name,
                     domain,
                     "",
                     user_linkedin_url,
-                    tool_config
+                    tool_config,
                 )
-                if is_guess_usable(guessed_result):
-                    if guessed_result.get("email_confidence", "").lower() == "high":
-                        input_properties["email"] = guessed_result["email"]
-                        input_properties["email_validation_status"] = "valid"
-                    else:
-                        additional_properties["guessed_email"] = guessed_result.get("email", "")
-                        input_properties["email"] = guessed_result["email"]
-                        input_properties["email_validation_status"] = "invalid"
+                input_properties["email"] = g["email"]
+                if is_guess_usable(g) and g["email_confidence"] == "high":
+                    input_properties["email_validation_status"] = "valid"
                 else:
-                    additional_properties["guessed_email"] = guessed_result.get("email", "")
-                    input_properties["email"] = guessed_result.get("email", "")
                     input_properties["email_validation_status"] = "invalid"
-            # --- FIX ENDS HERE ---
+                    additional_properties["guessed_email"] = g["email"]
     input_properties["additional_properties"] = additional_properties
-    logger.info("Exiting process_email_properties.")
+    logger.info("Exiting process_email_properties")
     return input_properties
-# --------------------------------------------------------------------------------
-# 6. Helper Functions
-# --------------------------------------------------------------------------------
+# ===========================================================================
+# 6.  HELPER FUNCTIONS
+# ===========================================================================
 async def safe_read_json_or_text(response: aiohttp.ClientResponse) -> Any:
-    """
-    Safely attempts to parse an aiohttp response as JSON, else returns text.
-    """
+    """Attempt JSON parsing; fallback to text."""
     try:
         return await response.json()
-    except Exception:
+    except Exception:  # noqa: BLE001
         return await response.text()
 def extract_domain(email: str) -> str:
-    """Extract domain from email ( user@domain.com -> domain.com )."""
-    if "@" not in email:
-        return ""
-    return email.split("@")[-1].strip()
+    """user@domain.com → domain.com"""
+    return email.split("@")[-1].strip() if "@" in email else ""
 def is_guess_usable(guess_result: Dict[str, Any]) -> bool:
-    """
-    Decide if a guessed email is "usable".
-    Here we treat "high" or "medium" as usable.
-    Adjust as needed.
-    """
+    """Treat high/medium as usable."""
     if not guess_result:
         return False
-    email_confidence = guess_result.get("email_confidence", "").lower()
-    return email_confidence in ["high", "medium"]
+    return guess_result.get("email_confidence", "").lower() in ("high", "medium")

dhisana 0.0.1.dev85__py3-none-any.whl → 0.0.1.dev236__py3-none-any.whl

dhisana 0.0.1.dev85__py3-none-any.whl → 0.0.1.dev236__py3-none-any.whl