PyPI - MultiFactor - Versions diffs - 0.2.7__tar.gz → 0.2.9__tar.gz - Mend

MultiFactor 0.2.7__tar.gz → 0.2.9__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (25)

{multifactor-0.2.7 → multifactor-0.2.9}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: MultiFactor
-Version: 0.2.7
+Version: 0.2.9
 Summary: 멀티팩터 기반 주식 데이터 수집 패키지
 Author-email: HANHO <hanhoman@gmail.com>
 Classifier: Programming Language :: Python :: 3

{multifactor-0.2.7 → multifactor-0.2.9}/pyproject.toml RENAMED Viewed

@@ -5,7 +5,7 @@ build-backend = "setuptools.build_meta"
 [project]
 # 1. PyPI에 등록될 배포 이름 (pip install MultiFactor)
 name = "MultiFactor"
-version = "0.2.7"
+version = "0.2.9"
 authors = [
   { name="HANHO", email="hanhoman@gmail.com" },
 ]

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/us_stockinfo.py RENAMED Viewed

@@ -3,6 +3,30 @@ import FinanceDataReader as fdr
 import pandas as pd
 import numpy as np
+def clean_us_symbol(symbol):
+    """
+    미국 주식 심볼 표준화 (yfinance 호환 및 데이터 병합 일관성을 위해)
+    예: BRK.B, BRK/B, BRKB -> BRK-B
+        BF.B, BF/B, BFB -> BF-B
+    """
+    if not isinstance(symbol, str):
+        return symbol
+    symbol = symbol.strip().upper()
+    symbol = symbol.replace('/', '-').replace('.', '-')
+    # yfinance에서 하이픈(-) 구분자를 사용하는 대표적인 클래스 주식의 루트 심볼 목록
+    # 구분자 없이 붙어있는 경우(예: BRKB, BFB)만 선별적으로 변환하여
+    # ALB(알베말), APA(APA Corp), BA(보잉), FOXA(폭스), NWSA(뉴스콥) 등의 오탐지를 방지합니다.
+    hyphen_roots = {'BRK', 'BF', 'LEN', 'STZ', 'HEI', 'JW', 'MOG'}
+    for root in hyphen_roots:
+        if symbol == f"{root}A":
+            return f"{root}-A"
+        elif symbol == f"{root}B":
+            return f"{root}-B"
+    return symbol
 def get_us_stockinfo(N=500):
     """
     미국 종목정보 추출 (GitHub 시가총액 데이터 + FDR 상세정보 병합)
@@ -12,6 +36,7 @@ def get_us_stockinfo(N=500):
     try:
         # 1. GitHub에서 최신 S&P 500 데이터 로드 (시가총액 등 순위용)
         df = pd.read_csv(url)
+        df['symbol'] = df['symbol'].astype(str).apply(clean_us_symbol)
         # 2. FDR에서 KR/US 전체 상장 종목 정보 로드 (명칭 일관성 유지)
         df_sp500 = fdr.StockListing('S&P500')
@@ -20,11 +45,27 @@ def get_us_stockinfo(N=500):
         # 3. FDR 데이터 병합 및 중복 제거
         fdr_stocks = pd.concat([df_sp500, df_nasdaq, df_nyse])
+        fdr_stocks['Symbol'] = fdr_stocks['Symbol'].astype(str).apply(clean_us_symbol)
         fdr_stocks = fdr_stocks.drop_duplicates(subset='Symbol')
-        # 4. Symbol 기준으로 조인하여 FDR의 Name을 사용
-        # fdr_stocks 에는 Symbol, Name, Sector, Industry 컬럼이 포함됨
-        df = df.merge(fdr_stocks[['Symbol', 'Name']], left_on='symbol', right_on='Symbol', how='left')
+        # FDR Sector 이름을 GitHub CSV의 industry 대분류 형태로 변환하기 위한 맵핑
+        sector_mapping = {
+            'Information Technology': 'Technology',
+            'Financials': 'Finance',
+            'Materials': 'Basic Materials',
+            'Communication Services': 'Telecommunications'
+        }
+        fdr_stocks['Sector_mapped'] = fdr_stocks['Sector'].map(sector_mapping).fillna(fdr_stocks['Sector'])
+        # 4. Symbol 기준으로 조인하여 FDR의 Name 및 맵핑된 Sector(대분류)를 가져옴
+        df = df.merge(
+            fdr_stocks[['Symbol', 'Name', 'Sector_mapped']],
+            left_on='symbol', right_on='Symbol',
+            how='left'
+        )
+        # GitHub CSV의 industry 컬럼에 결측치(NaN)가 있으면 FDR에서 맵핑한 Sector로 보완
+        df['industry'] = df['industry'].fillna(df['Sector_mapped'])
         # 5. 컬럼명을 기존 시스템과 동일하게 변경 (GitHub의 name 대신 FDR의 Name 사용)
         column_map = {
@@ -56,9 +97,9 @@ def get_us_stockinfo(N=500):
         if 'Symbol' in df.columns:
             df = df.rename(columns={'Symbol': 'Code'})
-    # 7. 종목코드 클렌징 (yfinance 호환을 위해 / 를 - 로 변경. 예: BRK/B -> BRK-B)
+    # 7. 종목코드 클렌징 (yfinance 호환을 위해 표준화 적용)
     if 'Code' in df.columns:
-        df['Code'] = df['Code'].str.replace('/', '-', regex=False)
+        df['Code'] = df['Code'].astype(str).apply(clean_us_symbol)
     # 8. 상위 N개 추출 및 인덱스 초기화
     df = df.head(N).reset_index(drop=True)

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: MultiFactor
-Version: 0.2.7
+Version: 0.2.9
 Summary: 멀티팩터 기반 주식 데이터 수집 패키지
 Author-email: HANHO <hanhoman@gmail.com>
 Classifier: Programming Language :: Python :: 3

{multifactor-0.2.7 → multifactor-0.2.9}/README.md RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/setup.cfg RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/__init__.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/core.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/momentum.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/momentum_one.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/quality.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/quality_one.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/score.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/score_adj_weight.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/stockinfo.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/us_core.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/us_momentum.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/us_quality.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/us_value.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/value.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor/value_one.py RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor.egg-info/SOURCES.txt RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor.egg-info/dependency_links.txt RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor.egg-info/requires.txt RENAMED Viewed

File without changes

{multifactor-0.2.7 → multifactor-0.2.9}/src/MultiFactor.egg-info/top_level.txt RENAMED Viewed

File without changes

MultiFactor 0.2.7__tar.gz → 0.2.9__tar.gz

MultiFactor 0.2.7__tar.gz → 0.2.9__tar.gz