amplify-excel-migrator 1.1.5__py3-none-any.whl → 1.2.15__py3-none-any.whl

This diff shows the changes between two publicly released versions of the package, as published to a supported registry. It is provided for informational purposes only and reflects the package contents exactly as they appear in the public registry.
Files changed (45)
  1. amplify_excel_migrator/__init__.py +17 -0
  2. amplify_excel_migrator/auth/__init__.py +6 -0
  3. amplify_excel_migrator/auth/cognito_auth.py +306 -0
  4. amplify_excel_migrator/auth/provider.py +42 -0
  5. amplify_excel_migrator/cli/__init__.py +5 -0
  6. amplify_excel_migrator/cli/commands.py +165 -0
  7. amplify_excel_migrator/client.py +47 -0
  8. amplify_excel_migrator/core/__init__.py +5 -0
  9. amplify_excel_migrator/core/config.py +98 -0
  10. amplify_excel_migrator/data/__init__.py +7 -0
  11. amplify_excel_migrator/data/excel_reader.py +23 -0
  12. amplify_excel_migrator/data/transformer.py +119 -0
  13. amplify_excel_migrator/data/validator.py +48 -0
  14. amplify_excel_migrator/graphql/__init__.py +8 -0
  15. amplify_excel_migrator/graphql/client.py +137 -0
  16. amplify_excel_migrator/graphql/executor.py +405 -0
  17. amplify_excel_migrator/graphql/mutation_builder.py +80 -0
  18. amplify_excel_migrator/graphql/query_builder.py +194 -0
  19. amplify_excel_migrator/migration/__init__.py +8 -0
  20. amplify_excel_migrator/migration/batch_uploader.py +23 -0
  21. amplify_excel_migrator/migration/failure_tracker.py +92 -0
  22. amplify_excel_migrator/migration/orchestrator.py +143 -0
  23. amplify_excel_migrator/migration/progress_reporter.py +57 -0
  24. amplify_excel_migrator/schema/__init__.py +6 -0
  25. model_field_parser.py → amplify_excel_migrator/schema/field_parser.py +100 -22
  26. amplify_excel_migrator/schema/introspector.py +95 -0
  27. {amplify_excel_migrator-1.1.5.dist-info → amplify_excel_migrator-1.2.15.dist-info}/METADATA +121 -26
  28. amplify_excel_migrator-1.2.15.dist-info/RECORD +40 -0
  29. amplify_excel_migrator-1.2.15.dist-info/entry_points.txt +2 -0
  30. amplify_excel_migrator-1.2.15.dist-info/top_level.txt +2 -0
  31. tests/__init__.py +1 -0
  32. tests/test_cli_commands.py +292 -0
  33. tests/test_client.py +187 -0
  34. tests/test_cognito_auth.py +363 -0
  35. tests/test_config_manager.py +347 -0
  36. tests/test_field_parser.py +615 -0
  37. tests/test_mutation_builder.py +391 -0
  38. tests/test_query_builder.py +384 -0
  39. amplify_client.py +0 -941
  40. amplify_excel_migrator-1.1.5.dist-info/RECORD +0 -9
  41. amplify_excel_migrator-1.1.5.dist-info/entry_points.txt +0 -2
  42. amplify_excel_migrator-1.1.5.dist-info/top_level.txt +0 -3
  43. migrator.py +0 -437
  44. {amplify_excel_migrator-1.1.5.dist-info → amplify_excel_migrator-1.2.15.dist-info}/WHEEL +0 -0
  45. {amplify_excel_migrator-1.1.5.dist-info → amplify_excel_migrator-1.2.15.dist-info}/licenses/LICENSE +0 -0
amplify_client.py DELETED
@@ -1,941 +0,0 @@
- import asyncio
- import logging
- import sys
- from getpass import getpass
- from typing import Dict, Any
-
- import aiohttp
- import boto3
- import requests
- import jwt
- import inflect
- from botocore.exceptions import NoCredentialsError, ProfileNotFound, NoRegionError, ClientError
- from pycognito import Cognito, MFAChallengeException
- from pycognito.exceptions import ForceChangePasswordException
-
- logging.basicConfig(level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s")
- logger = logging.getLogger(__name__)
-
-
- class AuthenticationError(Exception):
-     """Raised when authentication is required but not completed"""
-
-     pass
-
-
- class GraphQLError(Exception):
-     """Raised when GraphQL query returns errors"""
-
-     pass
-
-
- class AmplifyClient:
-     """
-     Client for Amplify GraphQL using ADMIN_USER_PASSWORD_AUTH flow
-     """
-
-     def __init__(self, api_endpoint: str, user_pool_id: str, region: str, client_id: str):
-         """
-         Initialize the client
-
-         Args:
-             api_endpoint: Amplify GraphQL endpoint
-             user_pool_id: Cognito User Pool ID
-             region: AWS region
-             client_id: Cognito App Client ID
-         """
-
-         self.api_endpoint = api_endpoint
-         self.user_pool_id = user_pool_id
-         self.region = region
-         self.client_id = client_id
-
-         self.batch_size = 20
-         self.cognito_client = None
-         self.boto_cognito_admin_client = None
-         self.id_token = None
-         self.mfa_tokens = None
-         self.admin_group_name = "ADMINS"
-
-         self.records_cache = {}
-
-     def init_cognito_client(self, is_aws_admin: bool, username: str = None, aws_profile: str = None):
-         try:
-             if is_aws_admin:
-                 if aws_profile:
-                     session = boto3.Session(profile_name=aws_profile)
-                     self.boto_cognito_admin_client = session.client("cognito-idp", region_name=self.region)
-                 else:
-                     # Use default AWS credentials (from ~/.aws/credentials, env vars, or IAM role)
-                     self.boto_cognito_admin_client = boto3.client("cognito-idp", region_name=self.region)
-
-             else:
-                 self.cognito_client = Cognito(
-                     user_pool_id=self.user_pool_id,
-                     client_id=self.client_id,
-                     user_pool_region=self.region,
-                     username=username,
-                 )
-
-         except NoCredentialsError:
-             logger.error("AWS credentials not found. Please configure AWS credentials.")
-             logger.error("Options: 1) AWS CLI: 'aws configure', 2) Environment variables, 3) Pass credentials directly")
-             raise RuntimeError(
-                 "Failed to initialize client: No AWS credentials found. "
-                 "Run 'aws configure' or set AWS_ACCESS_KEY_ID and AWS_SECRET_ACCESS_KEY environment variables."
-             )
-
-         except ProfileNotFound:
-             logger.error(f"AWS profile '{aws_profile}' not found")
-             raise RuntimeError(
-                 f"Failed to initialize client: AWS profile '{aws_profile}' not found. "
-                 f"Available profiles can be found in ~/.aws/credentials"
-             )
-
-         except NoRegionError:
-             logger.error("No AWS region specified")
-             raise RuntimeError(
-                 f"Failed to initialize client: No AWS region specified. "
-                 f"Provide region parameter or set AWS_DEFAULT_REGION environment variable."
-             )
-
-         except ValueError as e:
-             logger.error(f"Invalid parameter: {e}")
-             raise
-
-         except ClientError as e:
-             error_code = e.response.get("Error", {}).get("Code", "Unknown")
-             error_msg = e.response.get("Error", {}).get("Message", str(e))
-             logger.error(f"AWS Client Error [{error_code}]: {error_msg}")
-             raise RuntimeError(f"Failed to initialize client: AWS error [{error_code}]: {error_msg}")
-
-         except Exception as e:
-             logger.error(f"Error during client initialization: {e}")
-             raise RuntimeError(f"Failed to initialize client: {e}")
-
-     def authenticate(self, username: str, password: str, mfa_code: str = None) -> bool:
-         try:
-             if not self.cognito_client:
-                 self.init_cognito_client(is_aws_admin=False, username=username)
-
-             if mfa_code and self.mfa_tokens:
-                 if not self._complete_mfa_challenge(mfa_code):
-                     return False
-             else:
-                 self.cognito_client.authenticate(password=password)
-
-             self.id_token = self.cognito_client.id_token
-
-             self._check_user_in_admins_group(self.id_token)
-
-             logger.info("✅ Authentication successful")
-             return True
-
-         except MFAChallengeException as e:
-             logger.warning("MFA required")
-             if hasattr(e, "get_tokens"):
-                 self.mfa_tokens = e.get_tokens()
-
-                 mfa_code = input("Enter MFA code: ").strip()
-                 if mfa_code:
-                     return self.authenticate(username, password, mfa_code)
-                 else:
-                     logger.error("MFA code required but not provided")
-                     return False
-             else:
-                 logger.error("MFA challenge received but no session tokens available")
-                 return False
-
-         except ForceChangePasswordException:
-             logger.warning("Password change required")
-             new_password = input("Your password has expired. Enter new password: ").strip()
-             confirm_password = input("Confirm new password: ").strip()
-             if new_password != confirm_password:
-                 logger.error("Passwords do not match")
-                 return False
-
-             try:
-                 self.cognito_client.new_password_challenge(password, new_password)
-                 return self.authenticate(username, new_password)
-
-             except Exception as e:
-                 logger.error(f"Failed to change password: {e}")
-                 return False
-
-         except Exception as e:
-             logger.error(f"Authentication failed: {e}")
-             return False
-
-     def aws_admin_authenticate(self, username: str, password: str) -> bool:
-         """
-         Requires AWS credentials with cognito-idp:ListUserPoolClients permission
-         """
-         try:
-             if not self.boto_cognito_admin_client:
-                 self.init_cognito_client(is_aws_admin=True)
-
-             print(f"Authenticating {username} using ADMIN_USER_PASSWORD_AUTH flow...")
-
-             response = self.boto_cognito_admin_client.admin_initiate_auth(
-                 UserPoolId=self.user_pool_id,
-                 ClientId=self.client_id,
-                 AuthFlow="ADMIN_USER_PASSWORD_AUTH",
-                 AuthParameters={"USERNAME": username, "PASSWORD": password},
-             )
-
-             self._check_for_mfa_challenges(response, username)
-
-             if "AuthenticationResult" in response:
-                 self.id_token = response["AuthenticationResult"]["IdToken"]
-             else:
-                 logger.error("❌ Authentication failed: No AuthenticationResult in response")
-                 return False
-
-             self._check_user_in_admins_group(self.id_token)
-
-             print(f"✅ Authentication successful")
-             return True
-
-         except self.cognito_client.exceptions.NotAuthorizedException as e:
-             logger.error(f"❌ Authentication failed: {e}")
-             return False
-
-         except self.cognito_client.exceptions.UserNotFoundException:
-             logger.error(f"❌ User not found: {username}")
-             return False
-
-         except Exception as e:
-             logger.error(f"❌ Error during authentication: {e}")
-             return False
-
-     def _complete_mfa_challenge(self, mfa_code: str) -> bool:
-         try:
-             if not self.mfa_tokens:
-                 logger.error("No MFA session tokens available")
-                 return False
-
-             challenge_name = self.mfa_tokens.get("ChallengeName", "SMS_MFA")
-
-             if "SOFTWARE_TOKEN" in challenge_name:
-                 self.cognito_client.respond_to_software_token_mfa_challenge(code=mfa_code, mfa_tokens=self.mfa_tokens)
-             else:
-                 self.cognito_client.respond_to_sms_mfa_challenge(code=mfa_code, mfa_tokens=self.mfa_tokens)
-
-             logger.info("✅ MFA challenge successful")
-             return True
-
-         except Exception as e:
-             logger.error(f"MFA challenge failed: {e}")
-             return False
-
-     def _get_client_id(self) -> str:
-         if self.client_id:
-             return self.client_id
-
-         try:
-             if not self.boto_cognito_admin_client:
-                 self.boto_cognito_admin_client(is_aws_admin=True)
-             response = self.boto_cognito_admin_client.list_user_pool_clients(UserPoolId=self.user_pool_id, MaxResults=1)
-
-             if response["UserPoolClients"]:
-                 client_id = response["UserPoolClients"][0]["ClientId"]
-                 return client_id
-
-             raise Exception("No User Pool clients found")
-
-         except self.cognito_client.exceptions.ResourceNotFoundException:
-             raise Exception(f"User Pool not found or AWS credentials lack permission")
-         except Exception as e:
-             raise Exception(f"Failed to get Client ID: {e}")
-
-     def _check_for_mfa_challenges(self, response, username: str) -> bool:
-         if "ChallengeName" in response:
-             challenge = response["ChallengeName"]
-
-             if challenge == "MFA_SETUP":
-                 logger.error("MFA setup required")
-                 return False
-
-             elif challenge == "SMS_MFA" or challenge == "SOFTWARE_TOKEN_MFA":
-                 mfa_code = input("Enter MFA code: ")
-                 _ = self.cognito_client.admin_respond_to_auth_challenge(
-                     UserPoolId=self.user_pool_id,
-                     ClientId=self.client_id,
-                     ChallengeName=challenge,
-                     Session=response["Session"],
-                     ChallengeResponses={
-                         "USERNAME": username,
-                         "SMS_MFA_CODE" if challenge == "SMS_MFA" else "SOFTWARE_TOKEN_MFA_CODE": mfa_code,
-                     },
-                 )
-
-             elif challenge == "NEW_PASSWORD_REQUIRED":
-                 new_password = getpass("Enter new password: ")
-                 _ = self.cognito_client.admin_respond_to_auth_challenge(
-                     UserPoolId=self.user_pool_id,
-                     ClientId=self.client_id,
-                     ChallengeName=challenge,
-                     Session=response["Session"],
-                     ChallengeResponses={"USERNAME": username, "NEW_PASSWORD": new_password},
-                 )
-
-         return False
-
-     def _check_user_in_admins_group(self, id_token: str):
-         print(jwt.__version__)
-
-         claims = jwt.decode(id_token, options={"verify_signature": False})
-         groups = claims.get("cognito:groups", [])
-
-         if self.admin_group_name not in groups:
-             raise PermissionError("User is not in ADMINS group")
-
-     def _request(self, query: str, variables: Dict = None, context: str = None) -> Any | None:
-         """
-         Make a GraphQL request using the ID token
-
-         Args:
-             query: GraphQL query or mutation
-             variables: Variables for the query
-             context: Optional context string to include in error messages (e.g., row identifier)
-
-         Returns:
-             Response data
-         """
-         if not self.id_token:
-             raise AuthenticationError("Not authenticated. Call authenticate() first.")
-
-         headers = {"Authorization": self.id_token, "Content-Type": "application/json"}
-
-         payload = {"query": query, "variables": variables or {}}
-
-         context_msg = f" [{context}]" if context else ""
-
-         try:
-             response = requests.post(self.api_endpoint, headers=headers, json=payload)
-
-             if response.status_code == 200:
-                 result = response.json()
-
-                 if "errors" in result:
-                     raise GraphQLError(f"GraphQL errors{context_msg}: {result['errors']}")
-
-                 return result
-             else:
-                 logger.error(f"HTTP Error {response.status_code}{context_msg}: {response.text}")
-                 return None
-
-         except requests.exceptions.ConnectionError as e:
-             logger.error(
-                 f"Connection error{context_msg}: Unable to connect to API endpoint. Check your internet connection or the API endpoint URL."
-             )
-             sys.exit(1)
-
-         except requests.exceptions.Timeout as e:
-             logger.error(f"Request timeout{context_msg}: {e}")
-             return None
-
-         except requests.exceptions.HTTPError as e:
-             logger.error(f"HTTP error{context_msg}: {e}")
-             return None
-
-         except GraphQLError as e:
-             logger.error(str(e))
-             return None
-
-         except requests.exceptions.RequestException as e:
-             logger.error(f"Request error{context_msg}: {e}")
-             return None
-
-     async def _request_async(
-         self, session: aiohttp.ClientSession, query: str, variables: Dict = None, context: str = None
-     ) -> Any | None:
-         """
-         Async version of _request for parallel GraphQL requests
-
-         Args:
-             session: aiohttp ClientSession
-             query: GraphQL query or mutation
-             variables: Variables for the query
-             context: Optional context string to include in error messages (e.g., row identifier)
-
-         Returns:
-             Response data
-         """
-         if not self.id_token:
-             raise AuthenticationError("Not authenticated. Call authenticate() first.")
-
-         headers = {"Authorization": self.id_token, "Content-Type": "application/json"}
-
-         payload = {"query": query, "variables": variables or {}}
-
-         context_msg = f" [{context}]" if context else ""
-
-         try:
-             async with session.post(self.api_endpoint, headers=headers, json=payload) as response:
-                 if response.status == 200:
-                     result = await response.json()
-
-                     if "errors" in result:
-                         raise GraphQLError(f"GraphQL errors{context_msg}: {result['errors']}")
-
-                     return result
-                 else:
-                     text = await response.text()
-                     error_msg = f"HTTP Error {response.status}{context_msg}: {text}"
-                     logger.error(error_msg)
-                     raise aiohttp.ClientError(error_msg)
-
-         except aiohttp.ServerTimeoutError as e:
-             error_msg = f"Request timeout{context_msg}: {e}"
-             logger.error(error_msg)
-             raise aiohttp.ServerTimeoutError(error_msg)
-
-         except aiohttp.ClientConnectionError as e:
-             error_msg = f"Connection error{context_msg}: Unable to connect to API endpoint. {e}"
-             logger.error(error_msg)
-             raise aiohttp.ClientConnectionError(error_msg)
-
-         except aiohttp.ClientResponseError as e:
-             error_msg = f"HTTP response error{context_msg}: {e}"
-             logger.error(error_msg)
-             raise aiohttp.ClientResponseError(
-                 request_info=e.request_info, history=e.history, status=e.status, message=error_msg
-             )
-
-         except GraphQLError as e:
-             logger.error(str(e))
-             raise
-
-         except aiohttp.ClientError as e:
-             error_msg = f"Client error{context_msg}: {e}"
-             logger.error(error_msg)
-             raise aiohttp.ClientError(error_msg)
-
-     async def create_record_async(
-         self, session: aiohttp.ClientSession, data: Dict, model_name: str, primary_field: str
-     ) -> Dict | None:
-         mutation = f"""
-             mutation Create{model_name}($input: Create{model_name}Input!) {{
-                 create{model_name}(input: $input) {{
-                     id
-                     {primary_field}
-                 }}
-             }}
-         """
-
-         context = f"{model_name}: {primary_field}={data.get(primary_field)}"
-         result = await self._request_async(session, mutation, {"input": data}, context)
-
-         if result and "data" in result:
-             created = result["data"].get(f"create{model_name}")
-             if created:
-                 logger.info(f'Created {model_name} with {primary_field}="{data[primary_field]}" (ID: {created["id"]})')
-                 return created
-             else:
-                 logger.error(f'Failed to create {model_name} with {primary_field}="{data[primary_field]}"')
-
-         return None
-
-     async def check_record_exists_async(
-         self,
-         session: aiohttp.ClientSession,
-         model_name: str,
-         primary_field: str,
-         value: str,
-         is_secondary_index: bool,
-         record: Dict,
-         field_type: str = "String",
-     ) -> Dict | None:
-         context = f"{model_name}: {primary_field}={value}"
-
-         if is_secondary_index:
-             query_name = f"list{model_name}By{primary_field[0].upper() + primary_field[1:]}"
-             query = f"""
-                 query {query_name}(${primary_field}: {field_type}!) {{
-                     {query_name}({primary_field}: ${primary_field}) {{
-                         items {{
-                             id
-                         }}
-                     }}
-                 }}
-             """
-             result = await self._request_async(session, query, {primary_field: value}, context)
-             if result and "data" in result:
-                 items = result["data"].get(query_name, {}).get("items", [])
-                 if len(items) > 0:
-                     logger.warning(f'Record with {primary_field}="{value}" already exists in {model_name}')
-                     return None
-         else:
-             query_name = self._get_list_query_name(model_name)
-             query = f"""
-                 query List{model_name}s($filter: Model{model_name}FilterInput) {{
-                     {query_name}(filter: $filter) {{
-                         items {{
-                             id
-                         }}
-                     }}
-                 }}
-             """
-             filter_input = {primary_field: {"eq": value}}
-             result = await self._request_async(session, query, {"filter": filter_input}, context)
-             if result and "data" in result:
-                 items = result["data"].get(query_name, {}).get("items", [])
-                 if len(items) > 0:
-                     logger.error(f'Record with {primary_field}="{value}" already exists in {model_name}')
-                     return None
-
-         return record
-
-     async def upload_batch_async(
-         self, batch: list, model_name: str, primary_field: str, is_secondary_index: bool, field_type: str = "String"
-     ) -> tuple[int, int, list[Dict]]:
-         async with aiohttp.ClientSession() as session:
-             duplicate_checks = [
-                 self.check_record_exists_async(
-                     session, model_name, primary_field, record[primary_field], is_secondary_index, record, field_type
-                 )
-                 for record in batch
-             ]
-             check_results = await asyncio.gather(*duplicate_checks, return_exceptions=True)
-
-             filtered_batch = []
-             failed_records = []
-
-             for i, result in enumerate(check_results):
-                 if isinstance(result, Exception):
-                     error_msg = str(result)
-                     failed_records.append(
-                         {
-                             "primary_field": primary_field,
-                             "primary_field_value": batch[i].get(primary_field, "Unknown"),
-                             "error": f"Duplicate check error: {error_msg}",
-                         }
-                     )
-                     logger.error(f"Error checking duplicate: {result}")
-                 elif result is not None:
-                     filtered_batch.append(result)
-
-             if not filtered_batch:
-                 return 0, len(batch), failed_records
-
-             create_tasks = [
-                 self.create_record_async(session, record, model_name, primary_field) for record in filtered_batch
-             ]
-             results = await asyncio.gather(*create_tasks, return_exceptions=True)
-
-             for i, result in enumerate(results):
-                 if isinstance(result, Exception):
-                     error_msg = str(result)
-                     failed_records.append(
-                         {
-                             "primary_field": primary_field,
-                             "primary_field_value": filtered_batch[i].get(primary_field, "Unknown"),
-                             "error": error_msg,
-                         }
-                     )
-                 elif not result:
-                     failed_records.append(
-                         {
-                             "primary_field": primary_field,
-                             "primary_field_value": filtered_batch[i].get(primary_field, "Unknown"),
-                             "error": "Creation failed - no response",
-                         }
-                     )
-
-             success_count = sum(1 for r in results if r and not isinstance(r, Exception))
-             error_count = len(batch) - success_count
-
-             return success_count, error_count, failed_records
-
-     def get_model_structure(self, model_type: str) -> Dict:
-         query = f"""
-             query GetModelType {{
-                 __type(name: "{model_type}") {{
-                     name
-                     kind
-                     description
-                     fields {{
-                         name
-                         type {{
-                             name
-                             kind
-                             ofType {{
-                                 name
-                                 kind
-                                 ofType {{
-                                     name
-                                     kind
-                                 }}
-                             }}
-                         }}
-                         description
-                     }}
-                 }}
-             }}
-         """
-
-         response = self._request(query)
-         if response and "data" in response and "__type" in response["data"]:
-             return response["data"]["__type"]
-
-         return {}
-
-     def get_primary_field_name(self, model_name: str, parsed_model_structure: Dict[str, Any]) -> tuple[str, bool, str]:
-         """
-         Returns: (field_name, is_secondary_index, field_type)
-         """
-         secondary_index = self._get_secondary_index(model_name)
-         if secondary_index:
-             # Find the field type in parsed_model_structure
-             field_type = "String"
-             for field in parsed_model_structure["fields"]:
-                 if field["name"] == secondary_index:
-                     field_type = field["type"]
-                     break
-             return secondary_index, True, field_type
-
-         for field in parsed_model_structure["fields"]:
-             if field["is_required"] and field["is_scalar"] and field["name"] != "id":
-                 return field["name"], False, field["type"]
-
-         logger.error("No suitable primary field found (required scalar field other than id)")
-         return "", False, "String"
-
-     def _get_secondary_index(self, model_name: str) -> str:
-         query_structure = self.get_model_structure("Query")
-         if not query_structure:
-             logger.error("Query type not found in schema")
-             return ""
-
-         query_fields = query_structure["fields"]
-
-         pattern = f"{model_name}By"
-
-         for query in query_fields:
-             query_name = query["name"]
-             if pattern in query_name:
-                 pattern_index = query_name.index(pattern)
-                 field_name = query_name[pattern_index + len(pattern) :]
-                 return field_name[0].lower() + field_name[1:] if field_name else ""
-
-         return ""
-
-     def _get_list_query_name(self, model_name: str) -> str | None:
-         query_structure = self.get_model_structure("Query")
-         if not query_structure:
-             logger.error("Query type not found in schema")
-             return f"list{model_name}s"
-
-         query_fields = query_structure["fields"]
-         p = inflect.engine()
-
-         candidates = [f"list{model_name}"]
-         capitals = [i for i, c in enumerate(model_name) if c.isupper()]
-
-         if len(capitals) > 1:
-             last_word_start = capitals[-1]
-             prefix = model_name[:last_word_start]
-             last_word = model_name[last_word_start:]
-
-             last_word_plural = str(p.plural(last_word.lower())) # type: ignore[arg-type]
-             last_word_plural_cap = last_word_plural[0].upper() + last_word_plural[1:] if last_word_plural else ""
-
-             pascal_plural = f"{prefix}{last_word_plural_cap}"
-             candidates.append(f"list{pascal_plural}")
-
-         full_plural = str(p.plural(model_name.lower())) # type: ignore[arg-type]
-         full_plural_cap = full_plural[0].upper() + full_plural[1:] if full_plural else ""
-         candidates.append(f"list{full_plural_cap}")
-
-         for query in query_fields:
-             query_name = query["name"]
-             if query_name in candidates and "By" not in query_name:
-                 return query_name
-
-         logger.error(f"No list query found for model {model_name}, tried: {candidates}")
-         return None
-
-     def upload(
-         self, records: list, model_name: str, parsed_model_structure: Dict[str, Any]
-     ) -> tuple[int, int, list[Dict]]:
-         logger.info("Uploading to Amplify backend...")
-
-         success_count = 0
-         error_count = 0
-         all_failed_records = []
-         num_of_batches = (len(records) + self.batch_size - 1) // self.batch_size
-
-         primary_field, is_secondary_index, field_type = self.get_primary_field_name(model_name, parsed_model_structure)
-         if not primary_field:
-             logger.error(f"Aborting upload for model {model_name}")
-             return 0, len(records), []
-
-         for i in range(0, len(records), self.batch_size):
-             batch = records[i : i + self.batch_size]
-             logger.info(f"Uploading batch {i // self.batch_size + 1} / {num_of_batches} ({len(batch)} items)...")
-
-             batch_success, batch_error, batch_failed_records = asyncio.run(
-                 self.upload_batch_async(batch, model_name, primary_field, is_secondary_index, field_type)
-             )
-             success_count += batch_success
-             error_count += batch_error
-             all_failed_records.extend(batch_failed_records)
-
-             logger.info(
-                 f"Processed batch {i // self.batch_size + 1} of model {model_name}: {success_count} success, {error_count} errors"
-             )
-
-         return success_count, error_count, all_failed_records
-
-     def list_records_by_secondary_index(
-         self, model_name: str, secondary_index: str, value: str = None, fields: list = None, field_type: str = "String"
-     ) -> Dict | None:
-         if fields is None:
-             fields = ["id", secondary_index]
-
-         fields_str = "\n".join(fields)
-         all_items = []
-         next_token = None
-
-         if not value:
-             query_name = self._get_list_query_name(model_name)
-
-             while True:
-                 query = f"""
-                     query List{model_name}s($limit: Int, $nextToken: String) {{
-                         {query_name}(limit: $limit, nextToken: $nextToken) {{
-                             items {{
-                                 {fields_str}
-                             }}
-                             nextToken
-                         }}
-                     }}
-                 """
-                 variables = {"limit": 1000, "nextToken": next_token}
-                 result = self._request(query, variables)
-
-                 if result and "data" in result:
-                     data = result["data"].get(query_name, {})
-                     items = data.get("items", [])
-                     all_items.extend(items)
-                     next_token = data.get("nextToken")
-
-                     if not next_token:
-                         break
-                 else:
-                     break
-         else:
-             query_name = f"list{model_name}By{secondary_index[0].upper() + secondary_index[1:]}"
-
-             while True:
-                 query = f"""
-                     query {query_name}(${secondary_index}: {field_type}!, $limit: Int, $nextToken: String) {{
-                         {query_name}({secondary_index}: ${secondary_index}, limit: $limit, nextToken: $nextToken) {{
-                             items {{
-                                 {fields_str}
-                             }}
-                             nextToken
-                         }}
-                     }}
-                 """
-                 variables = {secondary_index: value, "limit": 1000, "nextToken": next_token}
-                 result = self._request(query, variables)
-
-                 if result and "data" in result:
-                     data = result["data"].get(query_name, {})
-                     items = data.get("items", [])
-                     all_items.extend(items)
-                     next_token = data.get("nextToken")
-
-                     if not next_token:
-                         break
-                 else:
-                     break
-
-         return all_items if all_items else None
-
-     def list_records_by_field(
-         self, model_name: str, field_name: str, value: str = None, fields: list = None
-     ) -> Dict | None:
-         if fields is None:
-             fields = ["id", field_name]
-
-         fields_str = "\n".join(fields)
-         all_items = []
-         next_token = None
-
-         query_name = self._get_list_query_name(model_name)
-
-         if not value:
-             while True:
-                 query = f"""
-                     query List{model_name}s($limit: Int, $nextToken: String) {{
-                         {query_name}(limit: $limit, nextToken: $nextToken) {{
-                             items {{
-                                 {fields_str}
-                             }}
-                             nextToken
-                         }}
-                     }}
-                 """
-                 variables = {"limit": 1000, "nextToken": next_token}
-                 result = self._request(query, variables)
-
-                 if result and "data" in result:
-                     data = result["data"].get(query_name, {})
-                     items = data.get("items", [])
-                     all_items.extend(items)
-                     next_token = data.get("nextToken")
-
-                     if not next_token:
-                         break
-                 else:
-                     break
-         else:
-             while True:
-                 query = f"""
-                     query List{model_name}s($filter: Model{model_name}FilterInput, $limit: Int, $nextToken: String) {{
-                         {query_name}(filter: $filter, limit: $limit, nextToken: $nextToken) {{
-                             items {{
-                                 {fields_str}
-                             }}
-                             nextToken
-                         }}
-                     }}
-                 """
-                 filter_input = {field_name: {"eq": value}}
-                 variables = {"filter": filter_input, "limit": 1000, "nextToken": next_token}
-                 result = self._request(query, variables)
-
-                 if result and "data" in result:
-                     data = result["data"].get(query_name, {})
-                     items = data.get("items", [])
-                     all_items.extend(items)
-                     next_token = data.get("nextToken")
-
-                     if not next_token:
-                         break
-                 else:
-                     break
-
-         return all_items if all_items else None
-
-     def get_record_by_id(self, model_name: str, record_id: str, fields: list = None) -> Dict | None:
-         if fields is None:
-             fields = ["id"]
-
-         fields_str = "\n".join(fields)
-
-         query_name = f"get{model_name}"
-         query = f"""
-             query Get{model_name}($id: ID!) {{
-                 {query_name}(id: $id) {{
-                     {fields_str}
-                 }}
-             }}
-         """
-
-         result = self._request(query, {"id": record_id})
-
-         if result and "data" in result:
-             return result["data"].get(query_name)
-
-         return None
-
-     def get_records(
-         self,
-         model_name: str,
-         primary_field: str = None,
-         is_secondary_index: bool = None,
-         fields: list = None,
-     ) -> list | None:
-         if model_name in self.records_cache:
-             return self.records_cache[model_name]
-
-         if not primary_field:
-             return None
-         if is_secondary_index:
-             records = self.list_records_by_secondary_index(model_name, primary_field, fields=fields)
-         else:
-             records = self.list_records_by_field(model_name, primary_field, fields=fields)
-
-         if records:
-             self.records_cache[model_name] = records
-             logger.debug(f"💾 Cached {len(records)} records for {model_name}")
-         return records
-
-     def get_record(
-         self,
-         model_name: str,
-         parsed_model_structure: Dict[str, Any] = None,
-         value: str = None,
-         record_id: str = None,
-         primary_field: str = None,
-         is_secondary_index: bool = None,
-         fields: list = None,
-     ) -> Dict | None:
-         if record_id:
-             return self.get_record_by_id(model_name, record_id)
-
-         if not primary_field:
-             if not parsed_model_structure:
-                 logger.error("Parsed model structure required if primary_field not provided")
-                 return None
-             primary_field, is_secondary_index, _ = self.get_primary_field_name(model_name, parsed_model_structure)
-         records = self.get_records(model_name, primary_field, is_secondary_index, fields)
-         if not records:
-             return None
-         return next((record for record in records if record.get(primary_field) == value), None)
-
-     def build_foreign_key_lookups(self, df, parsed_model_structure: Dict[str, Any]) -> Dict[str, Dict[str, str]]:
-         """
-         Build a cache of foreign key lookups for all ID fields in the DataFrame.
-
-         This pre-fetches all related records to avoid N+1 query problems during row processing.
-
-         Args:
-             df: pandas DataFrame containing the data to be processed
-             parsed_model_structure: Parsed model structure containing field information
-
-         Returns:
-             Dictionary mapping model names to lookup dictionaries and primary fields
-         """
-
-         fk_lookup_cache = {}
-
-         for field in parsed_model_structure["fields"]:
-             if not field["is_id"]:
-                 continue
-
-             field_name = field["name"][:-2]
-
-             if field_name not in df.columns:
-                 continue
-
-             if "related_model" in field:
-                 related_model = field["related_model"]
-             else:
-                 related_model = field_name[0].upper() + field_name[1:]
-
-             if related_model in fk_lookup_cache:
-                 continue
-
-             try:
-                 primary_field, is_secondary_index, _ = self.get_primary_field_name(
-                     related_model, parsed_model_structure
-                 )
-                 records = self.get_records(related_model, primary_field, is_secondary_index)
-
-                 if records:
-                     lookup = {
-                         str(record.get(primary_field)): record.get("id")
-                         for record in records
-                         if record.get(primary_field)
-                     }
-                     fk_lookup_cache[related_model] = {"lookup": lookup, "primary_field": primary_field}
-                     logger.debug(f" 📦 Cached {len(lookup)} {related_model} records")
-             except Exception as e:
-                 logger.warning(f" ⚠️ Could not pre-fetch {related_model}: {e}")
-
-         return fk_lookup_cache