neurostats-API 0.0.14__py3-none-any.whl → 0.0.15__py3-none-any.whl
Sign up to get free protection for your applications and to get access to all the features.
- neurostats_API/__init__.py +13 -1
- neurostats_API/fetchers/__init__.py +2 -0
- neurostats_API/fetchers/base.py +102 -4
- neurostats_API/fetchers/tech.py +34 -7
- neurostats_API/fetchers/tej_finance_report.py +313 -0
- neurostats_API/utils/__init__.py +2 -1
- neurostats_API/utils/calculate_value.py +26 -0
- neurostats_API/utils/data_process.py +56 -1
- {neurostats_API-0.0.14.dist-info → neurostats_API-0.0.15.dist-info}/METADATA +68 -3
- {neurostats_API-0.0.14.dist-info → neurostats_API-0.0.15.dist-info}/RECORD +12 -10
- {neurostats_API-0.0.14.dist-info → neurostats_API-0.0.15.dist-info}/WHEEL +1 -1
- {neurostats_API-0.0.14.dist-info → neurostats_API-0.0.15.dist-info}/top_level.txt +0 -0
neurostats_API/__init__.py
CHANGED
@@ -1 +1,13 @@
|
|
1
|
-
__version__='0.0.
|
1
|
+
__version__='0.0.15'
|
2
|
+
|
3
|
+
from .fetchers import (
|
4
|
+
BalanceSheetFetcher,
|
5
|
+
CashFlowFetcher,
|
6
|
+
FinanceOverviewFetcher,
|
7
|
+
FinanceReportFetcher,
|
8
|
+
InstitutionFetcher,
|
9
|
+
MarginTradingFetcher,
|
10
|
+
MonthRevenueFetcher,
|
11
|
+
TechFetcher,
|
12
|
+
ProfitLoseFetcher
|
13
|
+
)
|
@@ -2,6 +2,8 @@ from .base import StatsDateTime, StatsFetcher
|
|
2
2
|
from .balance_sheet import BalanceSheetFetcher
|
3
3
|
from .cash_flow import CashFlowFetcher
|
4
4
|
from .finance_overview import FinanceOverviewFetcher
|
5
|
+
from .tej_finance_report import FinanceReportFetcher
|
6
|
+
from .tech import TechFetcher
|
5
7
|
from .institution import InstitutionFetcher
|
6
8
|
from .margin_trading import MarginTradingFetcher
|
7
9
|
from .month_revenue import MonthRevenueFetcher
|
neurostats_API/fetchers/base.py
CHANGED
@@ -1,16 +1,16 @@
|
|
1
|
+
import abc
|
1
2
|
from pymongo import MongoClient
|
2
3
|
import pandas as pd
|
3
4
|
import json
|
4
5
|
import pytz
|
5
6
|
from datetime import datetime, timedelta, date
|
6
|
-
from ..utils import StatsDateTime, StatsProcessor
|
7
|
+
from ..utils import StatsDateTime, StatsProcessor, YoY_Calculator
|
7
8
|
import yaml
|
8
9
|
|
9
10
|
class StatsFetcher:
|
10
11
|
def __init__(self, ticker, db_client):
|
11
12
|
self.ticker = ticker
|
12
|
-
self.db = db_client[
|
13
|
-
"company"] # Replace with your database name
|
13
|
+
self.db = db_client["company"] # Replace with your database name
|
14
14
|
self.collection = self.db["twse_stats"]
|
15
15
|
|
16
16
|
self.timezone = pytz.timezone("Asia/Taipei")
|
@@ -37,7 +37,7 @@ class StatsFetcher:
|
|
37
37
|
]
|
38
38
|
|
39
39
|
def collect_data(self, start_date, end_date):
|
40
|
-
pipeline = self.prepare_query(
|
40
|
+
pipeline = self.prepare_query()
|
41
41
|
|
42
42
|
fetched_data = list(self.collection.aggregate(pipeline))
|
43
43
|
|
@@ -52,3 +52,101 @@ class StatsFetcher:
|
|
52
52
|
season = (month - 1) // 3 + 1
|
53
53
|
|
54
54
|
return StatsDateTime(date, year, month, day, season)
|
55
|
+
|
56
|
+
class BaseTEJFetcher(abc.ABC):
|
57
|
+
def __init__(self):
|
58
|
+
self.client = None
|
59
|
+
self.db = None
|
60
|
+
self.collection = None
|
61
|
+
|
62
|
+
@abc.abstractmethod
|
63
|
+
def get(self):
|
64
|
+
pass
|
65
|
+
|
66
|
+
def get_latest_data_time(self, ticker):
|
67
|
+
latest_data = self.collection.find_one(
|
68
|
+
{"ticker": ticker},
|
69
|
+
{"last_update": 1, "_id" : 0}
|
70
|
+
)
|
71
|
+
|
72
|
+
try:
|
73
|
+
latest_date = latest_data['last_update']["latest_data_date"]
|
74
|
+
except Exception as e:
|
75
|
+
latest_date = None
|
76
|
+
|
77
|
+
return latest_date
|
78
|
+
|
79
|
+
def cal_YoY(self, data_dict: dict, start_year: int, end_year: int):
|
80
|
+
year_shifts = [1,3,5,10]
|
81
|
+
return_dict = {}
|
82
|
+
for year in range(start_year, end_year+1):
|
83
|
+
year_data = data_dict[str(year)]
|
84
|
+
year_keys = list(year_data.keys())
|
85
|
+
for key in year_keys:
|
86
|
+
if (key in 'season'):
|
87
|
+
continue
|
88
|
+
|
89
|
+
if (isinstance(year_data[key], (int, float))):
|
90
|
+
temp_dict = {"value": year_data[key]}
|
91
|
+
|
92
|
+
for shift in year_shifts:
|
93
|
+
this_value = year_data[key]
|
94
|
+
try:
|
95
|
+
past_year = str(year - shift)
|
96
|
+
last_value = data_dict[past_year][key]['value']
|
97
|
+
temp_dict[f"YoY_{shift}"] = YoY_Calculator.cal_growth(
|
98
|
+
this_value, last_value, delta = shift
|
99
|
+
)
|
100
|
+
except Exception as e:
|
101
|
+
temp_dict[f"YoY_{shift}"] = None
|
102
|
+
|
103
|
+
year_data[key] = temp_dict
|
104
|
+
|
105
|
+
else:
|
106
|
+
year_data.pop(key)
|
107
|
+
|
108
|
+
return_dict[year] = year_data
|
109
|
+
|
110
|
+
|
111
|
+
return return_dict
|
112
|
+
|
113
|
+
def cal_QoQ(self, data_dict):
|
114
|
+
return_dict = {}
|
115
|
+
for i, time_index in enumerate(data_dict.keys()):
|
116
|
+
year, season = time_index.split("Q")
|
117
|
+
year = int(year)
|
118
|
+
season = int(season)
|
119
|
+
if (season == 1):
|
120
|
+
last_year = year - 1
|
121
|
+
last_season = 4
|
122
|
+
else:
|
123
|
+
last_year = year
|
124
|
+
last_season = season - 1
|
125
|
+
|
126
|
+
this_data = data_dict[time_index]
|
127
|
+
this_keys = list(this_data.keys())
|
128
|
+
for key in this_keys:
|
129
|
+
if (key in 'season'):
|
130
|
+
continue
|
131
|
+
|
132
|
+
this_value = this_data[key]
|
133
|
+
|
134
|
+
if (isinstance(this_value, (int, float))):
|
135
|
+
temp_dict = {"value": this_value}
|
136
|
+
|
137
|
+
try:
|
138
|
+
last_value = data_dict[f"{last_year}Q{last_season}"][key]['value']
|
139
|
+
|
140
|
+
temp_dict['growth'] = YoY_Calculator.cal_growth(
|
141
|
+
this_value, last_value, delta=1
|
142
|
+
)
|
143
|
+
except Exception as e:
|
144
|
+
temp_dict['growth'] = None
|
145
|
+
|
146
|
+
this_data[key] = temp_dict
|
147
|
+
|
148
|
+
else:
|
149
|
+
this_data.pop(key)
|
150
|
+
return_dict[time_index] = this_data
|
151
|
+
return return_dict
|
152
|
+
|
neurostats_API/fetchers/tech.py
CHANGED
@@ -1,9 +1,16 @@
|
|
1
1
|
from .base import StatsFetcher
|
2
2
|
import pandas as pd
|
3
|
+
import yfinance as yf
|
3
4
|
|
4
5
|
class TechFetcher(StatsFetcher):
|
5
6
|
|
6
7
|
def __init__(self, ticker:str, db_client):
|
8
|
+
|
9
|
+
"""
|
10
|
+
The Capitalization-Weighted Index includes the following tickers:
|
11
|
+
['GSPC', 'IXIC', 'DJI', 'TWII']
|
12
|
+
"""
|
13
|
+
|
7
14
|
super().__init__(ticker, db_client)
|
8
15
|
self.full_ohlcv = self._get_ohlcv()
|
9
16
|
self.basic_indexes = ['SMA5', 'SMA20', 'SMA60', 'EMA5', 'EMA20',
|
@@ -40,16 +47,36 @@ class TechFetcher(StatsFetcher):
|
|
40
47
|
)
|
41
48
|
|
42
49
|
def _get_ohlcv(self):
|
43
|
-
|
44
|
-
|
50
|
+
|
51
|
+
if self.ticker in ['GSPC', 'IXIC', 'DJI', 'TWII']:
|
52
|
+
|
53
|
+
full_tick = f'^{self.ticker}'
|
54
|
+
yf_ticker = yf.Ticker(full_tick)
|
55
|
+
origin_df = yf_ticker.history(period="10y")
|
56
|
+
origin_df = origin_df.reset_index()
|
57
|
+
origin_df["Date"] = pd.to_datetime(origin_df["Date"]).dt.date
|
58
|
+
df = origin_df.rename(
|
59
|
+
columns={
|
60
|
+
"Date": "date",
|
61
|
+
"Open": "open",
|
62
|
+
"High": "high",
|
63
|
+
"Low": "low",
|
64
|
+
"Close": "close",
|
65
|
+
"Volume": "volume"
|
66
|
+
}
|
67
|
+
)
|
68
|
+
else:
|
69
|
+
|
70
|
+
query = {'ticker': self.ticker}
|
71
|
+
ticker_full = list(self.collection.find(query))
|
45
72
|
|
46
|
-
|
47
|
-
|
73
|
+
if not ticker_full:
|
74
|
+
raise ValueError(f"No data found for ticker: {self.ticker}")
|
48
75
|
|
49
|
-
|
50
|
-
|
76
|
+
if 'daily_data' not in ticker_full[0] or ticker_full[0]['daily_data'] is None:
|
77
|
+
raise KeyError("Missing 'daily_data' in the retrieved data")
|
51
78
|
|
52
|
-
|
79
|
+
df = pd.DataFrame(ticker_full[0]['daily_data'])
|
53
80
|
|
54
81
|
selected_cols = ['date','open','high','low','close','volume']
|
55
82
|
|
@@ -0,0 +1,313 @@
|
|
1
|
+
from .base import BaseTEJFetcher
|
2
|
+
from datetime import datetime
|
3
|
+
from enum import Enum
|
4
|
+
import pandas as pd
|
5
|
+
from pymongo import MongoClient
|
6
|
+
from ..utils import StatsProcessor, YoY_Calculator
|
7
|
+
import warnings
|
8
|
+
|
9
|
+
|
10
|
+
class FinanceReportFetcher(BaseTEJFetcher):
|
11
|
+
class FetchMode(Enum):
|
12
|
+
YOY = 1
|
13
|
+
QOQ = 2
|
14
|
+
YOY_NOCAL = 3
|
15
|
+
QOQ_NOCAL = 4
|
16
|
+
|
17
|
+
def __init__(self, mongo_uri, db_name = "company", collection_name = "TWN/AINVFQ1"):
|
18
|
+
self.client = MongoClient(mongo_uri)
|
19
|
+
self.db = self.client[db_name]
|
20
|
+
self.collection = self.db[collection_name]
|
21
|
+
|
22
|
+
self.check_index = {
|
23
|
+
'coid', 'mdate', 'key3', 'no',
|
24
|
+
'sem', 'merg', 'curr', 'annd',
|
25
|
+
'fin_ind', 'bp11', 'bp21', 'bp22',
|
26
|
+
'bp31', 'bp41', 'bp51', 'bp53',
|
27
|
+
'bp61', 'bp62', 'bp63', 'bp64',
|
28
|
+
'bp65', 'bf11', 'bf12', 'bf21',
|
29
|
+
'bf22', 'bf41', 'bf42', 'bf43',
|
30
|
+
'bf44', 'bf45', 'bf99', 'bsca',
|
31
|
+
'bsnca', 'bsta','bscl','bsncl',
|
32
|
+
'bstl','bsse','bslse','debt',
|
33
|
+
'quick','ppe','ar','ip12',
|
34
|
+
'ip22','ip31','ip51','iv41',
|
35
|
+
'if11','isibt','isni','isnip',
|
36
|
+
'eps','ispsd','gm','opi',
|
37
|
+
'nri','ri','nopi','ebit',
|
38
|
+
'cip31','cscfo','cscfi','cscff',
|
39
|
+
'person','shares','wavg','taxrate',
|
40
|
+
'r104','r115','r105','r106',
|
41
|
+
'r107','r108','r201','r112',
|
42
|
+
'r401','r402','r403','r404',
|
43
|
+
'r405','r408','r409','r410',
|
44
|
+
'r502','r501','r205','r505',
|
45
|
+
'r517','r512','r509','r608',
|
46
|
+
'r616','r610','r607','r613',
|
47
|
+
'r612','r609','r614','r611',
|
48
|
+
'r307','r304','r305','r306',
|
49
|
+
'r316','r834'
|
50
|
+
}
|
51
|
+
|
52
|
+
def get(
|
53
|
+
self,
|
54
|
+
ticker,
|
55
|
+
fetch_mode: FetchMode = FetchMode.QOQ,
|
56
|
+
start_date: str = None,
|
57
|
+
end_date: str = None,
|
58
|
+
report_type: str = "Q",
|
59
|
+
indexes: list = []
|
60
|
+
):
|
61
|
+
"""
|
62
|
+
基礎的query function
|
63
|
+
ticker(str): 股票代碼
|
64
|
+
start_date(str): 開頭日期範圍
|
65
|
+
end_date(str): = 結束日期範圍
|
66
|
+
report_type(str): 報告型態 {"A", "Q", "TTM"}
|
67
|
+
fetch_mode(class FetchMode):
|
68
|
+
YoY : 起始日期到結束日期範圍內,特定該季的資料
|
69
|
+
QoQ : 起始日期到結束日期內,每季的資料(與上一季成長率)
|
70
|
+
indexes(List): 指定的index
|
71
|
+
"""
|
72
|
+
# 確認indexes中是否有錯誤的index,有的話回傳warning
|
73
|
+
if (indexes and self.check_index):
|
74
|
+
indexes = set(indexes)
|
75
|
+
difference = indexes-self.check_index
|
76
|
+
if (difference):
|
77
|
+
warnings.warn(
|
78
|
+
f"{list(difference)} 沒有出現在資料表中,請確認column名稱是否正確",
|
79
|
+
UserWarning
|
80
|
+
)
|
81
|
+
|
82
|
+
|
83
|
+
if (fetch_mode in {
|
84
|
+
self.FetchMode.QOQ,
|
85
|
+
self.FetchMode.QOQ_NOCAL
|
86
|
+
}
|
87
|
+
):
|
88
|
+
if (not start_date):
|
89
|
+
warnings.warn("No start_date specified, use default date = \"2005-01-01\"", UserWarning)
|
90
|
+
start_date = datetime.strptime("2005-01-01", "%Y-%m-%d")
|
91
|
+
if (not end_date):
|
92
|
+
warnings.warn("No end_date specified, use default date = today", UserWarning)
|
93
|
+
end_date = datetime.today()
|
94
|
+
|
95
|
+
assert (start_date <= end_date)
|
96
|
+
start_date = datetime.strptime(start_date, "%Y-%m-%d")
|
97
|
+
end_date = datetime.strptime(end_date, "%Y-%m-%d")
|
98
|
+
|
99
|
+
start_year = start_date.year
|
100
|
+
start_season = (start_date.month - 1) // 4 + 1
|
101
|
+
end_year = end_date.year
|
102
|
+
end_season = (end_date.month - 1) // 4 + 1
|
103
|
+
|
104
|
+
if (fetch_mode == self.FetchMode.QOQ):
|
105
|
+
use_cal = True
|
106
|
+
else:
|
107
|
+
use_cal = False
|
108
|
+
|
109
|
+
data_df = self.get_QoQ_data(
|
110
|
+
ticker=ticker,
|
111
|
+
start_year=start_year,
|
112
|
+
start_season=start_season,
|
113
|
+
end_year=end_year,
|
114
|
+
end_season=end_season,
|
115
|
+
report_type=report_type,
|
116
|
+
indexes=indexes,
|
117
|
+
use_cal=use_cal
|
118
|
+
)
|
119
|
+
|
120
|
+
return data_df
|
121
|
+
|
122
|
+
elif (fetch_mode in {
|
123
|
+
self.FetchMode.YOY,
|
124
|
+
self.FetchMode.YOY_NOCAL
|
125
|
+
}
|
126
|
+
):
|
127
|
+
start_year = 2005
|
128
|
+
end_date = self.get_latest_data_time(ticker)
|
129
|
+
if (not end_date):
|
130
|
+
end_date = datetime.today()
|
131
|
+
|
132
|
+
end_year = end_date.year
|
133
|
+
season = (end_date.month - 1) // 4 + 1
|
134
|
+
|
135
|
+
if (fetch_mode == self.FetchMode.YOY):
|
136
|
+
use_cal = True
|
137
|
+
else:
|
138
|
+
use_cal = False
|
139
|
+
|
140
|
+
data_df = self.get_YoY_data(
|
141
|
+
ticker = ticker,
|
142
|
+
start_year = start_year,
|
143
|
+
end_year = end_year,
|
144
|
+
season = season,
|
145
|
+
report_type = report_type,
|
146
|
+
indexes = indexes
|
147
|
+
)
|
148
|
+
|
149
|
+
return data_df
|
150
|
+
|
151
|
+
def get_QoQ_data(
|
152
|
+
self,
|
153
|
+
ticker,
|
154
|
+
start_year,
|
155
|
+
start_season,
|
156
|
+
end_year,
|
157
|
+
end_season,
|
158
|
+
report_type = "Q",
|
159
|
+
indexes = [],
|
160
|
+
use_cal = False
|
161
|
+
):
|
162
|
+
"""
|
163
|
+
取得時間範圍內每季資料
|
164
|
+
"""
|
165
|
+
if (not indexes): # 沒有指定 -> 取全部
|
166
|
+
pipeline = [
|
167
|
+
{ "$match": { "ticker": ticker } },
|
168
|
+
{ "$unwind": "$data" },
|
169
|
+
{ "$match": {
|
170
|
+
"$or": [
|
171
|
+
{ "data.year": { "$gt": start_year, "$lt": end_year } },
|
172
|
+
{ "data.year": start_year, "data.season": { "$gte": start_season } },
|
173
|
+
{ "data.year": end_year, "data.season": { "$lte": end_season } }
|
174
|
+
]
|
175
|
+
}},
|
176
|
+
{ "$project": {
|
177
|
+
"data.year": 1,
|
178
|
+
"data.season": 1,
|
179
|
+
f"data.{report_type}": 1,
|
180
|
+
"_id": 0
|
181
|
+
}
|
182
|
+
}
|
183
|
+
]
|
184
|
+
|
185
|
+
|
186
|
+
else: # 取指定index
|
187
|
+
project_stage = {
|
188
|
+
"data.year": 1,
|
189
|
+
"data.season": 1
|
190
|
+
}
|
191
|
+
for index in indexes:
|
192
|
+
project_stage[f"data.{report_type}.{index}"] = 1
|
193
|
+
|
194
|
+
pipeline = [
|
195
|
+
{ "$match": { "ticker": ticker } },
|
196
|
+
{ "$unwind": "$data" },
|
197
|
+
{ "$match": {
|
198
|
+
"$or": [
|
199
|
+
{ "data.year": { "$gt": start_year, "$lt": end_year } },
|
200
|
+
{ "data.year": start_year, "data.season": { "$gte": start_season } },
|
201
|
+
{ "data.year": end_year, "data.season": { "$lte": end_season } }
|
202
|
+
]
|
203
|
+
}},
|
204
|
+
{ "$project": project_stage }
|
205
|
+
]
|
206
|
+
|
207
|
+
|
208
|
+
fetched_data = self.collection.aggregate(pipeline).to_list()
|
209
|
+
|
210
|
+
data_dict = StatsProcessor.list_of_dict_to_dict(
|
211
|
+
fetched_data,
|
212
|
+
keys = ["year", "season"],
|
213
|
+
delimeter = "Q",
|
214
|
+
data_key=report_type
|
215
|
+
)
|
216
|
+
if (use_cal):
|
217
|
+
data_with_QoQ = self.cal_QoQ(data_dict)
|
218
|
+
data_df = pd.DataFrame.from_dict(data_with_QoQ)
|
219
|
+
else:
|
220
|
+
data_df = pd.DataFrame.from_dict(data_dict)
|
221
|
+
return data_df
|
222
|
+
|
223
|
+
def get_YoY_data(
|
224
|
+
self,
|
225
|
+
ticker,
|
226
|
+
start_year,
|
227
|
+
end_year,
|
228
|
+
season,
|
229
|
+
report_type = "Q",
|
230
|
+
indexes = [],
|
231
|
+
use_cal = False
|
232
|
+
):
|
233
|
+
"""
|
234
|
+
取得某季歷年資料
|
235
|
+
"""
|
236
|
+
if (use_cal):
|
237
|
+
select_year = set()
|
238
|
+
|
239
|
+
for year in range(start_year, end_year + 1):
|
240
|
+
year_shifts = {
|
241
|
+
year,
|
242
|
+
year - 1,
|
243
|
+
year - 3,
|
244
|
+
year - 5,
|
245
|
+
year - 10
|
246
|
+
}
|
247
|
+
|
248
|
+
select_year = select_year.union(year_shifts)
|
249
|
+
|
250
|
+
select_year = sorted(list(select_year), reverse=True)
|
251
|
+
else:
|
252
|
+
select_year = [year for year in range(start_year, end_year + 1)]
|
253
|
+
|
254
|
+
if (not indexes): # 沒有指定 -> 取全部
|
255
|
+
pipeline = [
|
256
|
+
{ "$match": { "ticker": ticker } },
|
257
|
+
{ "$unwind": "$data" },
|
258
|
+
{ "$match": {
|
259
|
+
"$or":[
|
260
|
+
{
|
261
|
+
"$and": [
|
262
|
+
{ "data.year": {"$in": select_year }},
|
263
|
+
{ "data.season": {"$eq": season}}
|
264
|
+
]
|
265
|
+
},
|
266
|
+
]
|
267
|
+
}},
|
268
|
+
{ "$project": {
|
269
|
+
"data.year": 1,
|
270
|
+
"data.season": 1,
|
271
|
+
f"data.{report_type}": 1,
|
272
|
+
"_id": 0
|
273
|
+
}
|
274
|
+
}
|
275
|
+
]
|
276
|
+
|
277
|
+
|
278
|
+
else: # 取指定index
|
279
|
+
project_stage = {
|
280
|
+
"data.year": 1,
|
281
|
+
"data.season": 1
|
282
|
+
}
|
283
|
+
for index in indexes:
|
284
|
+
project_stage[f"data.{report_type}.{index}"] = 1
|
285
|
+
|
286
|
+
pipeline = [
|
287
|
+
{ "$match": { "ticker": ticker } },
|
288
|
+
{ "$unwind": "$data" },
|
289
|
+
{ "$match": {
|
290
|
+
"$and": [
|
291
|
+
{ "data.year": {"$in": select_year}},
|
292
|
+
{ "data.season": {"$eq": season}}
|
293
|
+
]
|
294
|
+
}},
|
295
|
+
{ "$project": project_stage }
|
296
|
+
]
|
297
|
+
|
298
|
+
fetched_data = self.collection.aggregate(pipeline).to_list()
|
299
|
+
|
300
|
+
# 處理計算YoY
|
301
|
+
data_dict = StatsProcessor.list_of_dict_to_dict(
|
302
|
+
fetched_data,
|
303
|
+
keys = ['year', 'season'],
|
304
|
+
data_key=report_type,
|
305
|
+
delimeter='Q'
|
306
|
+
)
|
307
|
+
if (use_cal):
|
308
|
+
data_with_YoY = self.cal_YoY(data_dict, start_year, end_year)
|
309
|
+
result_df = pd.DataFrame.from_dict(data_with_YoY)
|
310
|
+
else:
|
311
|
+
result_df = pd.DataFrame.from_dict(data_dict)
|
312
|
+
|
313
|
+
return result_df
|
neurostats_API/utils/__init__.py
CHANGED
@@ -0,0 +1,26 @@
|
|
1
|
+
class YoY_Calculator:
|
2
|
+
def __init__(self):
|
3
|
+
pass
|
4
|
+
|
5
|
+
@classmethod
|
6
|
+
def cal_growth(cls, target_value: float, past_value: float, delta: int):
|
7
|
+
"""
|
8
|
+
計算成長率以及年化成長率
|
9
|
+
target_value: float,這個時間的數值
|
10
|
+
past_value: float,過去的這個時間數值
|
11
|
+
delta: int,代表隔了幾年/季 delta > 1 時改以年化成長率計算
|
12
|
+
"""
|
13
|
+
try:
|
14
|
+
if (delta > 1):
|
15
|
+
YoY = ((target_value / past_value)**(1 / delta)) - 1
|
16
|
+
|
17
|
+
else:
|
18
|
+
YoY = ((target_value - past_value) / past_value)
|
19
|
+
|
20
|
+
except Exception as e:
|
21
|
+
return None
|
22
|
+
|
23
|
+
if (isinstance(YoY, complex)): # 年化成長率有複數問題
|
24
|
+
return None
|
25
|
+
|
26
|
+
return YoY
|
@@ -20,7 +20,6 @@ class StatsProcessor:
|
|
20
20
|
"""
|
21
21
|
1. 讀檔: txt / yaml
|
22
22
|
2. 將巢狀dictionary / DataFrame扁平化
|
23
|
-
|
24
23
|
"""
|
25
24
|
|
26
25
|
@classmethod
|
@@ -215,3 +214,59 @@ class StatsProcessor:
|
|
215
214
|
return int(np.round(value).item())
|
216
215
|
else:
|
217
216
|
return value
|
217
|
+
|
218
|
+
@classmethod
|
219
|
+
def list_of_dict_to_dict(
|
220
|
+
cls,
|
221
|
+
data_list: list,
|
222
|
+
key: str = "",
|
223
|
+
keys: list = [],
|
224
|
+
delimeter: str = "_",
|
225
|
+
data_key: str = "Q"
|
226
|
+
):
|
227
|
+
"""
|
228
|
+
TEJ DB 用
|
229
|
+
List[Dict] -> Dict[Dict]
|
230
|
+
input:
|
231
|
+
data_list(List):
|
232
|
+
[
|
233
|
+
{ "data":
|
234
|
+
{
|
235
|
+
"year": 2021...
|
236
|
+
"season": 1,
|
237
|
+
"Q": {}...
|
238
|
+
|
239
|
+
}
|
240
|
+
}
|
241
|
+
]
|
242
|
+
|
243
|
+
key(str): 選擇哪一個key作為轉化後的index
|
244
|
+
delimeter(str): 多個key時要用甚麼分隔
|
245
|
+
return:
|
246
|
+
{
|
247
|
+
"2021" : {# Q下的資料} ...
|
248
|
+
}
|
249
|
+
|
250
|
+
or (keys = ['year', 'season'])
|
251
|
+
{
|
252
|
+
"2021Q2" : {}
|
253
|
+
}
|
254
|
+
"""
|
255
|
+
assert (key or keys), "func list_of_dict_to_dict must have argument \"key\" or \"keys\""
|
256
|
+
|
257
|
+
return_dict = {}
|
258
|
+
if (key):
|
259
|
+
keys = [key]
|
260
|
+
for data in data_list:
|
261
|
+
data = data['data']
|
262
|
+
|
263
|
+
pop_keys = []
|
264
|
+
|
265
|
+
for key in keys:
|
266
|
+
assert (key in data.keys())
|
267
|
+
pop_keys.append(str(data.pop(key)))
|
268
|
+
|
269
|
+
pop_key = delimeter.join(pop_keys)
|
270
|
+
return_dict[pop_key] = data[data_key]
|
271
|
+
|
272
|
+
return return_dict
|
@@ -1,12 +1,18 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
|
-
Name:
|
3
|
-
Version: 0.0.
|
2
|
+
Name: neurostats-API
|
3
|
+
Version: 0.0.15
|
4
4
|
Summary: The service of NeuroStats website
|
5
5
|
Home-page: https://github.com/NeurowattStats/NeuroStats_API.git
|
6
6
|
Author: JasonWang@Neurowatt
|
7
7
|
Author-email: jason@neurowatt.ai
|
8
8
|
Requires-Python: >=3.6
|
9
9
|
Description-Content-Type: text/markdown
|
10
|
+
Requires-Dist: numpy>=2.1.0
|
11
|
+
Requires-Dist: pandas>=2.2.0
|
12
|
+
Requires-Dist: pymongo
|
13
|
+
Requires-Dist: pytz
|
14
|
+
Requires-Dist: python-dotenv
|
15
|
+
Requires-Dist: yfinance
|
10
16
|
|
11
17
|
# neurostats_API
|
12
18
|
|
@@ -83,7 +89,7 @@ pip install neurostats-API
|
|
83
89
|
```Python
|
84
90
|
>>> import neurostats_API
|
85
91
|
>>> print(neurostats_API.__version__)
|
86
|
-
0.0.
|
92
|
+
0.0.15
|
87
93
|
```
|
88
94
|
|
89
95
|
### 得到最新一期的評價資料與歷年評價
|
@@ -667,7 +673,66 @@ fetcher.query()
|
|
667
673
|
|
668
674
|
請注意`range`, `last_range`, `52week_range`這三個項目型態為字串,其餘為float
|
669
675
|
|
676
|
+
|
677
|
+
## TEJ 相關
|
678
|
+
### 會計師簽證財務資料
|
679
|
+
```Python
|
680
|
+
from neurostats_API import FinanceReportFetcher
|
681
|
+
|
682
|
+
mongo_uri = <MongoDB 的 URI>
|
683
|
+
db_name = 'company' # 連接的DB名稱
|
684
|
+
collection_name = "TWN/AINVFQ1" # 連接的collection對象
|
685
|
+
|
686
|
+
fetcher = FinanceReportFetcher(
|
687
|
+
mongo_uri = mongo_uri,
|
688
|
+
db_name = db_name,
|
689
|
+
collection_name = collection_name
|
690
|
+
)
|
691
|
+
|
692
|
+
data = fetcher.get(
|
693
|
+
ticker = "2330" # 任意的股票代碼
|
694
|
+
fetch_mode = fetcher.YOY_NOCAL # 取得模式
|
695
|
+
start_date = "2005-01-01",
|
696
|
+
end_date = "2024-12-31",
|
697
|
+
report_type = "Q",
|
698
|
+
indexes = []
|
699
|
+
)
|
700
|
+
```
|
701
|
+
- `ticker`: 股票代碼
|
702
|
+
|
703
|
+
- `fetch_mode` : 取得模式,為`fetcher.YOY_NOCAL` 或 `fetcher.QOQ_NOCAL`
|
704
|
+
- `YOY_NOCAL`: 以end_date為準,取得與end_date為準同季的歷年資料,時間範圍以start_date為準
|
705
|
+
> 例如`start_date = "2020-07-01"`, `end_date = "2024-01-01"`,會回傳2020~2024的第一季資料
|
706
|
+
|
707
|
+
- `QOQ_NOCAL`: 時間範圍內的每季資料
|
708
|
+
|
709
|
+
- `start_date`: 開始日期,不設定時預設為`2005-01-01`
|
710
|
+
|
711
|
+
- `end_date`: 結束日期,不設定時預設為資料庫最新資料的日期
|
712
|
+
|
713
|
+
- `report_type`: 選擇哪種報告,預設為`Q`
|
714
|
+
- `A`: 當年累計
|
715
|
+
- `Q`: 當季數值
|
716
|
+
- `TTM`: 移動四季 (包括當季在內,往前累計四個季度)
|
717
|
+
|
718
|
+
- `indexes`: 選擇的column,需要以TEJ提供的欄位名稱為準,不提供時或提供`[]`會回傳全部column
|
719
|
+
- 範例輸入: `['bp41', 'bp51']`
|
720
|
+
|
721
|
+
[TEJ資料集連結](https://tquant.tejwin.com/%E8%B3%87%E6%96%99%E9%9B%86/)
|
722
|
+
請看 `會計師簽證財務資料`
|
723
|
+
|
724
|
+
#### 回傳資料
|
725
|
+
fetch_mode設定為`YOY_NOCAL`與`QOQ_NOCAL`下
|
726
|
+
為回傳pd.DataFrame,column名稱為<年份>Q<季>, row名稱為指定財報項目
|
727
|
+
|
670
728
|
## 版本紀錄
|
729
|
+
## 0.0.15
|
730
|
+
- TechFetcher中新增指數條件
|
731
|
+
|
732
|
+
- 新增tej_fetcher索取TEJ相關的資料
|
733
|
+
|
734
|
+
- package新增depensnecy,可以安裝需要的相關package
|
735
|
+
|
671
736
|
## 0.0.14
|
672
737
|
- 修改部分財報資料錯誤的乘以1000的問題
|
673
738
|
|
@@ -1,28 +1,30 @@
|
|
1
|
-
neurostats_API/__init__.py,sha256=
|
1
|
+
neurostats_API/__init__.py,sha256=oEkbIWbrC6-8sBPEJQXg0QYoz3TNZtYXhSTEO6d0JcU,261
|
2
2
|
neurostats_API/cli.py,sha256=UJSWLIw03P24p-gkBb6JSEI5dW5U12UvLf1L8HjQD-o,873
|
3
3
|
neurostats_API/main.py,sha256=QcsfmWivg2Dnqw3MTJWiI0QvEiRs0VuH-BjwQHFCv00,677
|
4
|
-
neurostats_API/fetchers/__init__.py,sha256=
|
4
|
+
neurostats_API/fetchers/__init__.py,sha256=B4aBwVzf_X-YieEf3fZteU0qmBPVIB9VjrmkyWhLK18,489
|
5
5
|
neurostats_API/fetchers/balance_sheet.py,sha256=sQv4Gk5uoKURLEdh57YknOQWiyVwaXJ2Mw75jxNqUS0,5804
|
6
|
-
neurostats_API/fetchers/base.py,sha256=
|
6
|
+
neurostats_API/fetchers/base.py,sha256=4YS8MJR3u9Sg6dKX7QoCYuqNeQaoYHIlvPm5x8VQ72U,4882
|
7
7
|
neurostats_API/fetchers/cash_flow.py,sha256=TY7VAWVXkj5-mzH5Iu0sIE-oV8MvGmmDy0URNotNV1E,7614
|
8
8
|
neurostats_API/fetchers/finance_overview.py,sha256=PxUdWY0x030olYMLcCHDBn068JLmCE2RTOce1dxs5vM,27753
|
9
9
|
neurostats_API/fetchers/institution.py,sha256=UrcBc6t7u7CnEwUsf6YmLbbJ8VncdWpq8bCz17q2dgs,11168
|
10
10
|
neurostats_API/fetchers/margin_trading.py,sha256=lQImtNdvaBoSlKhJvQ3DkH3HjSSgKRJz4ZZpyR5-Z4I,10433
|
11
11
|
neurostats_API/fetchers/month_revenue.py,sha256=nixX2llzjCFr2m2YVjxrSfkBusnZPrPb2dRDq1XLGhw,4251
|
12
12
|
neurostats_API/fetchers/profit_lose.py,sha256=EN9Y0iamcAaHMZdjHXO6b_2buLnORssf8ZS7A0hi74s,5896
|
13
|
-
neurostats_API/fetchers/tech.py,sha256=
|
13
|
+
neurostats_API/fetchers/tech.py,sha256=Hol1bcwJ_ERcnoTXNWlqqaWOuzdl7MeiAjCvzQMZDTg,12269
|
14
|
+
neurostats_API/fetchers/tej_finance_report.py,sha256=VDP0Lx2ErCgIBBz7nbquC1ugkcnj6p7ehM2JtFInjsQ,10218
|
14
15
|
neurostats_API/fetchers/value_invest.py,sha256=_eQxuEnIYvksb06QHixGK29Gnwr_3xmI6Tu7dv4J__E,5769
|
15
16
|
neurostats_API/tools/balance_sheet.yaml,sha256=6XygNG_Ybb1Xkk1e39LMLKr7ATvaCP3xxuwFbgNl6dA,673
|
16
17
|
neurostats_API/tools/cash_flow_percentage.yaml,sha256=fk2Z4eb1JjGFvP134eJatHacB7BgTkBenhDJr83w8RE,1345
|
17
18
|
neurostats_API/tools/finance_overview_dict.yaml,sha256=B9nV75StXkrF3yv2-eezzitlJ38eEK86RD_VY6588gQ,2884
|
18
19
|
neurostats_API/tools/profit_lose.yaml,sha256=iyp9asYJ04vAxk_HBUDse_IBy5oVvYHpwsyACg5YEeg,3029
|
19
20
|
neurostats_API/tools/seasonal_data_field_dict.txt,sha256=X8yc_el6p8BH_3FikTqBVFGsvWdXT6MHXLfKfi44334,8491
|
20
|
-
neurostats_API/utils/__init__.py,sha256=
|
21
|
-
neurostats_API/utils/
|
21
|
+
neurostats_API/utils/__init__.py,sha256=0tJCRmlJq2aDwcNNW-oEaA9H0OxTJMFvjpVYtG4AvZU,186
|
22
|
+
neurostats_API/utils/calculate_value.py,sha256=lUKSsWU76XRmDUcmi4eDjoQxjb3vWpAAKInF9w49VNI,782
|
23
|
+
neurostats_API/utils/data_process.py,sha256=A--dzOsu42jRxqqCD41gTtjE5rhEBYmhB6y-AnCvo5U,8986
|
22
24
|
neurostats_API/utils/datetime.py,sha256=XJya4G8b_-ZOaBbMXgQjWh2MC4wc-o6goQ7EQJQMWrQ,773
|
23
25
|
neurostats_API/utils/db_client.py,sha256=OYe6yazcR4Aa6jYmy47JrryUeh2NnKGqY2K_lSZe6i8,455
|
24
26
|
neurostats_API/utils/fetcher.py,sha256=VbrUhjA-GG5AyjPX2SHtFIbZM4dm3jo0RgZzuCbb_Io,40927
|
25
|
-
neurostats_API-0.0.
|
26
|
-
neurostats_API-0.0.
|
27
|
-
neurostats_API-0.0.
|
28
|
-
neurostats_API-0.0.
|
27
|
+
neurostats_API-0.0.15.dist-info/METADATA,sha256=btfdGRam5QpUHFFiA_UPWYeZuAqAMYkEJ0Ufod399T4,27959
|
28
|
+
neurostats_API-0.0.15.dist-info/WHEEL,sha256=bFJAMchF8aTQGUgMZzHJyDDMPTO3ToJ7x23SLJa1SVo,92
|
29
|
+
neurostats_API-0.0.15.dist-info/top_level.txt,sha256=nSlQPMG0VtXivJyedp4Bkf86EOy2TpW10VGxolXrqnU,15
|
30
|
+
neurostats_API-0.0.15.dist-info/RECORD,,
|
File without changes
|