PyPI - datamule - Versions diffs - 0.381__py3-none-any.whl → 1.0.0__py3-none-any.whl - Mend

datamule 0.381__py3-none-any.whl → 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (73) hide show

datamule/__init__.py +46 -86
datamule/book.py +16 -0
datamule/config.py +29 -0
datamule/data/company_former_names.csv +8148 -8148
datamule/data/company_metadata.csv +10049 -10049
datamule/data/company_tickers.csv +9999 -10168
datamule/data/sec-glossary.csv +728 -728
datamule/data/xbrl_descriptions.csv +10024 -10024
datamule/document.py +278 -0
datamule/downloader/downloader.py +374 -0
datamule/downloader/premiumdownloader.py +335 -0
datamule/helper.py +123 -136
datamule/mapping_dicts/txt_mapping_dicts.py +232 -0
datamule/mapping_dicts/xml_mapping_dicts.py +19 -0
datamule/monitor.py +238 -0
datamule/mulebot/__init__.py +1 -1
datamule/mulebot/helper.py +34 -34
datamule/mulebot/mulebot.py +129 -129
datamule/mulebot/mulebot_server/server.py +86 -86
datamule/mulebot/mulebot_server/static/css/minimalist.css +173 -173
datamule/mulebot/mulebot_server/static/scripts/artifacts.js +67 -67
datamule/mulebot/mulebot_server/static/scripts/chat.js +91 -91
datamule/mulebot/mulebot_server/static/scripts/filingArtifacts.js +55 -55
datamule/mulebot/mulebot_server/static/scripts/listArtifacts.js +14 -14
datamule/mulebot/mulebot_server/static/scripts/main.js +56 -56
datamule/mulebot/mulebot_server/static/scripts/prefilledPrompt.js +26 -26
datamule/mulebot/mulebot_server/static/scripts/suggestions.js +46 -46
datamule/mulebot/mulebot_server/static/scripts/tableArtifacts.js +128 -128
datamule/mulebot/mulebot_server/static/scripts/utils.js +27 -27
datamule/mulebot/mulebot_server/templates/chat-minimalist.html +90 -90
datamule/mulebot/search.py +51 -51
datamule/mulebot/tools.py +82 -82
datamule/packageupdater.py +207 -0
datamule/portfolio.py +106 -0
datamule/submission.py +76 -0
datamule-1.0.0.dist-info/METADATA +27 -0
datamule-1.0.0.dist-info/RECORD +40 -0
{datamule-0.381.dist-info → datamule-1.0.0.dist-info}/WHEEL +1 -1
datamule/data/filing_types.csv +0 -485
datamule/data/ftd_locations.csv +0 -388
datamule/datamule_api.py +0 -21
datamule/dataset_builder/_init.py +0 -1
datamule/dataset_builder/dataset_builder.py +0 -260
datamule/downloader/__init__.py +0 -0
datamule/downloader/dropbox_downloader.py +0 -225
datamule/downloader/ftd.py +0 -216
datamule/downloader/information_table_13f.py +0 -231
datamule/downloader/sec_downloader.py +0 -635
datamule/filing_viewer/__init__.py +0 -1
datamule/filing_viewer/filing_viewer.py +0 -256
datamule/global_vars.py +0 -202
datamule/parser/__init__.py +0 -1
datamule/parser/basic_10k_parser.py +0 -82
datamule/parser/basic_10q_parser.py +0 -73
datamule/parser/basic_13d_parser.py +0 -58
datamule/parser/basic_13g_parser.py +0 -61
datamule/parser/basic_8k_parser.py +0 -84
datamule/parser/company_concepts_parser.py +0 -0
datamule/parser/form_d_parser.py +0 -70
datamule/parser/generalized_item_parser.py +0 -78
datamule/parser/generalized_xml_parser.py +0 -0
datamule/parser/helper.py +0 -75
datamule/parser/information_table_parser_13fhr.py +0 -41
datamule/parser/insider_trading_parser.py +0 -158
datamule/parser/mappings.py +0 -95
datamule/parser/n_port_p_parser.py +0 -70
datamule/parser/sec_parser.py +0 -79
datamule/parser/sgml_parser.py +0 -180
datamule/sec_filing.py +0 -126
datamule/sec_search.py +0 -20
datamule-0.381.dist-info/METADATA +0 -132
datamule-0.381.dist-info/RECORD +0 -61
{datamule-0.381.dist-info → datamule-1.0.0.dist-info}/top_level.txt +0 -0

datamule/mulebot/mulebot.py CHANGED Viewed

@@ -1,130 +1,130 @@
-import openai
-import json
-from datamule.helper import identifier_to_cik
-from datamule import Downloader, Parser
-from .search import search_filing
-from .tools import tools, return_title_tool
-from .helper import get_company_concept, select_dict_by_title
-downloader = Downloader()
-parser = Parser()
-class MuleBot:
-    def __init__(self, api_key):
-        self.client = openai.OpenAI(api_key=api_key)
-        self.messages = [
-            {"role": "system", "content": "You are a helpful, but concise, assistant to assist with questions related to the Securities and Exchanges Commission. You are allowed to guess tickers."}
-        ]
-        self.total_tokens = 0
-    def process_message(self, user_input):
-        new_message_chain = self.messages
-        new_message_chain.append({"role": "user", "content": user_input})
-        try:
-            response = self.client.chat.completions.create(
-                model="gpt-4o-mini",
-                messages=new_message_chain,
-                tools=tools,
-                tool_choice="auto"
-            )
-            self.total_tokens += response.usage.total_tokens
-            assistant_message = response.choices[0].message
-            if assistant_message.content is None:
-                assistant_message.content = "I'm processing your request."
-            new_message_chain.append({"role": "assistant", "content": assistant_message.content})
-            tool_calls = assistant_message.tool_calls
-            if tool_calls is None:
-                return {'key':'text','value':assistant_message.content}
-            else:
-                for tool_call in tool_calls:
-                    print(f"Tool call: {tool_call.function.name}")
-                    if tool_call.function.name == "identifier_to_cik":
-                        function_args = json.loads(tool_call.function.arguments)
-                        print(f"Function args: {function_args}")
-                        cik = identifier_to_cik(function_args["ticker"])
-                        return {'key':'text','value':cik}
-                    elif tool_call.function.name == "get_company_concept":
-                        function_args = json.loads(tool_call.function.arguments)
-                        print(f"Function args: {function_args}")
-                        table_dict_list = get_company_concept(function_args["ticker"])
-                        return {'key':'table','value':table_dict_list}
-                    elif tool_call.function.name == "get_filing_urls":
-                        function_args = json.loads(tool_call.function.arguments)
-                        print(f"Function args: {function_args}")
-                        result = downloader.download(**function_args,return_urls=True)
-                        return {'key':'list','value':result}
-                    elif tool_call.function.name == "find_filing_section_by_title":
-                        function_args = json.loads(tool_call.function.arguments)
-                        print(f"Function args: {function_args}")
-                        # Parse the filing
-                        data = parser.parse_filing(function_args["url"])
-                        # find possible matches
-                        section_dicts = search_filing(query = function_args["title"], nested_dict =data, score_cutoff=0.3)
-                        # feed titles back to assistant
-                        titles = [section['title'] for section in section_dicts]
-                        new_message_chain.append({"role": "assistant", "content": f"Which of these titles is closest: {','.join(titles)}"})
-                        title_response = self.client.chat.completions.create(
-                            model="gpt-4o-mini",
-                            messages=new_message_chain,
-                            tools=[return_title_tool],
-                            tool_choice="required"
-                        )
-                        title_tool_call = title_response.choices[0].message.tool_calls[0]
-                        title = json.loads(title_tool_call.function.arguments)['title']
-                        print(f"Selected title: {title}")
-                        #print(f"Possible titles: {titles}")
-                        # select the section
-                        #section_dict = select_dict_by_title(data, title)
-                        # probably want to return full dict, and section label
-                        return {'key':'filing','value':{'data':data,'title':title}}
-            return {'key':'text','value':'No tool call was made.'}
-        except Exception as e:
-            return f"An error occurred: {str(e)}"
-    def get_total_tokens(self):
-        return self.total_tokens
-    def run(self):
-        """Basic chatbot loop"""
-        print("MuleBot: Hello! I'm here to assist you with questions related to the Securities and Exchange Commission. Type 'quit', 'exit', or 'bye' to end the conversation.")
-        while True:
-            user_input = input("You: ")
-            if user_input.lower() in ['quit', 'exit', 'bye']:
-                print("MuleBot: Goodbye!")
-                break
-            response = self.process_message(user_input)
-            response_type = response['key']
-            if response_type == 'text':
-                value = response['value']
-                print(value)
-            elif response_type == 'table':
-                value = response['value']
-                print(value)
-            elif response_type == 'list':
-                value = response['value']
-                print(value)
-            elif response_type == 'filing':
-                value = response['value']
-                print(value)
-            else:
-                value = response['value']
+import openai
+import json
+from datamule.helper import identifier_to_cik
+from datamule import Downloader, Parser
+from .search import search_filing
+from .tools import tools, return_title_tool
+from .helper import get_company_concept, select_dict_by_title
+downloader = Downloader()
+parser = Parser()
+class MuleBot:
+    def __init__(self, api_key):
+        self.client = openai.OpenAI(api_key=api_key)
+        self.messages = [
+            {"role": "system", "content": "You are a helpful, but concise, assistant to assist with questions related to the Securities and Exchanges Commission. You are allowed to guess tickers."}
+        ]
+        self.total_tokens = 0
+    def process_message(self, user_input):
+        new_message_chain = self.messages
+        new_message_chain.append({"role": "user", "content": user_input})
+        try:
+            response = self.client.chat.completions.create(
+                model="gpt-4o-mini",
+                messages=new_message_chain,
+                tools=tools,
+                tool_choice="auto"
+            )
+            self.total_tokens += response.usage.total_tokens
+            assistant_message = response.choices[0].message
+            if assistant_message.content is None:
+                assistant_message.content = "I'm processing your request."
+            new_message_chain.append({"role": "assistant", "content": assistant_message.content})
+            tool_calls = assistant_message.tool_calls
+            if tool_calls is None:
+                return {'key':'text','value':assistant_message.content}
+            else:
+                for tool_call in tool_calls:
+                    print(f"Tool call: {tool_call.function.name}")
+                    if tool_call.function.name == "identifier_to_cik":
+                        function_args = json.loads(tool_call.function.arguments)
+                        print(f"Function args: {function_args}")
+                        cik = identifier_to_cik(function_args["ticker"])
+                        return {'key':'text','value':cik}
+                    elif tool_call.function.name == "get_company_concept":
+                        function_args = json.loads(tool_call.function.arguments)
+                        print(f"Function args: {function_args}")
+                        table_dict_list = get_company_concept(function_args["ticker"])
+                        return {'key':'table','value':table_dict_list}
+                    elif tool_call.function.name == "get_filing_urls":
+                        function_args = json.loads(tool_call.function.arguments)
+                        print(f"Function args: {function_args}")
+                        result = downloader.download(**function_args,return_urls=True)
+                        return {'key':'list','value':result}
+                    elif tool_call.function.name == "find_filing_section_by_title":
+                        function_args = json.loads(tool_call.function.arguments)
+                        print(f"Function args: {function_args}")
+                        # Parse the filing
+                        data = parser.parse_filing(function_args["url"])
+                        # find possible matches
+                        section_dicts = search_filing(query = function_args["title"], nested_dict =data, score_cutoff=0.3)
+                        # feed titles back to assistant
+                        titles = [section['title'] for section in section_dicts]
+                        new_message_chain.append({"role": "assistant", "content": f"Which of these titles is closest: {','.join(titles)}"})
+                        title_response = self.client.chat.completions.create(
+                            model="gpt-4o-mini",
+                            messages=new_message_chain,
+                            tools=[return_title_tool],
+                            tool_choice="required"
+                        )
+                        title_tool_call = title_response.choices[0].message.tool_calls[0]
+                        title = json.loads(title_tool_call.function.arguments)['title']
+                        print(f"Selected title: {title}")
+                        #print(f"Possible titles: {titles}")
+                        # select the section
+                        #section_dict = select_dict_by_title(data, title)
+                        # probably want to return full dict, and section label
+                        return {'key':'filing','value':{'data':data,'title':title}}
+            return {'key':'text','value':'No tool call was made.'}
+        except Exception as e:
+            return f"An error occurred: {str(e)}"
+    def get_total_tokens(self):
+        return self.total_tokens
+    def run(self):
+        """Basic chatbot loop"""
+        print("MuleBot: Hello! I'm here to assist you with questions related to the Securities and Exchange Commission. Type 'quit', 'exit', or 'bye' to end the conversation.")
+        while True:
+            user_input = input("You: ")
+            if user_input.lower() in ['quit', 'exit', 'bye']:
+                print("MuleBot: Goodbye!")
+                break
+            response = self.process_message(user_input)
+            response_type = response['key']
+            if response_type == 'text':
+                value = response['value']
+                print(value)
+            elif response_type == 'table':
+                value = response['value']
+                print(value)
+            elif response_type == 'list':
+                value = response['value']
+                print(value)
+            elif response_type == 'filing':
+                value = response['value']
+                print(value)
+            else:
+                value = response['value']
                 print(value)

datamule/mulebot/mulebot_server/server.py CHANGED Viewed

@@ -1,87 +1,87 @@
-import os
-from flask import Flask, request, jsonify, render_template
-from datamule.mulebot import MuleBot
-from datamule.filing_viewer import create_interactive_filing, create_valid_id
-class MuleBotServer:
-    def __init__(self, template='chat-minimalist.html'):
-        template_dir = os.path.abspath(os.path.join(os.path.dirname(__file__), 'templates'))
-        static_dir = os.path.abspath(os.path.join(os.path.dirname(__file__), 'static'))
-        self.app = Flask(__name__, template_folder=template_dir, static_folder=static_dir)
-        self.mulebot = None
-        self.template = template
-        self.setup_routes()
-    def setup_routes(self):
-        @self.app.route('/')
-        def home():
-            return render_template(self.template)
-        @self.app.route('/chat-with-prompt')
-        def chat_with_prompt():
-            prefilled_prompt = request.args.get('prompt', '')
-            return render_template(self.template, prefilled_prompt=prefilled_prompt)
-        @self.app.route('/chat', methods=['POST'])
-        def chat():
-            user_input = request.json['message']
-            # Process the message using MuleBot's process_message method
-            response = self.mulebot.process_message(user_input)
-            response_type = response['key']
-            # Prepare the response based on the type
-            if response_type == 'text':
-                # If response type is text, add it to the chat
-                chat_response = {
-                    'type': 'text',
-                    'content': response['value']
-                }
-            elif response_type == 'table':
-                # If response type is table, prepare it for the artifact window
-                chat_response = {
-                    'type': 'artifact',
-                    'content': response['value'],
-                    'artifact_type': 'artifact-table'
-                }
-            elif response_type == 'list':
-                chat_response = {
-                    'type': 'artifact',
-                    'content': response['value'],
-                    'artifact_type': 'artifact-list'
-                }
-            elif response_type == 'filing':
-                data = response['value']['data']
-                title = response['value']['title']
-                section_id = create_valid_id(title)
-                # create a filing viewer display
-                html = create_interactive_filing(data)
-                # we'll need to display the filing viewer in the artifact window, with a json export option
-                chat_response = {
-                    'type': 'artifact',
-                    'content': html,
-                    'data': data,
-                    'section_id': section_id,
-                    'artifact_type': 'artifact-filing'
-                }
-            else:
-                # Handle other types of responses if needed
-                chat_response = {
-                    'type': 'unknown',
-                    'content': 'Unsupported response type'
-                }
-            return jsonify({
-                'response': chat_response,
-                'total_tokens': self.mulebot.get_total_tokens()
-            })
-    def set_api_key(self, api_key):
-        self.mulebot = MuleBot(api_key)
-    def run(self, debug=False, host='0.0.0.0', port=5000):
-        if not self.mulebot:
-            raise ValueError("API key not set. Please call set_api_key() before running the server.")
+import os
+from flask import Flask, request, jsonify, render_template
+from datamule.mulebot import MuleBot
+from datamule.filing_viewer import create_interactive_filing, create_valid_id
+class MuleBotServer:
+    def __init__(self, template='chat-minimalist.html'):
+        template_dir = os.path.abspath(os.path.join(os.path.dirname(__file__), 'templates'))
+        static_dir = os.path.abspath(os.path.join(os.path.dirname(__file__), 'static'))
+        self.app = Flask(__name__, template_folder=template_dir, static_folder=static_dir)
+        self.mulebot = None
+        self.template = template
+        self.setup_routes()
+    def setup_routes(self):
+        @self.app.route('/')
+        def home():
+            return render_template(self.template)
+        @self.app.route('/chat-with-prompt')
+        def chat_with_prompt():
+            prefilled_prompt = request.args.get('prompt', '')
+            return render_template(self.template, prefilled_prompt=prefilled_prompt)
+        @self.app.route('/chat', methods=['POST'])
+        def chat():
+            user_input = request.json['message']
+            # Process the message using MuleBot's process_message method
+            response = self.mulebot.process_message(user_input)
+            response_type = response['key']
+            # Prepare the response based on the type
+            if response_type == 'text':
+                # If response type is text, add it to the chat
+                chat_response = {
+                    'type': 'text',
+                    'content': response['value']
+                }
+            elif response_type == 'table':
+                # If response type is table, prepare it for the artifact window
+                chat_response = {
+                    'type': 'artifact',
+                    'content': response['value'],
+                    'artifact_type': 'artifact-table'
+                }
+            elif response_type == 'list':
+                chat_response = {
+                    'type': 'artifact',
+                    'content': response['value'],
+                    'artifact_type': 'artifact-list'
+                }
+            elif response_type == 'filing':
+                data = response['value']['data']
+                title = response['value']['title']
+                section_id = create_valid_id(title)
+                # create a filing viewer display
+                html = create_interactive_filing(data)
+                # we'll need to display the filing viewer in the artifact window, with a json export option
+                chat_response = {
+                    'type': 'artifact',
+                    'content': html,
+                    'data': data,
+                    'section_id': section_id,
+                    'artifact_type': 'artifact-filing'
+                }
+            else:
+                # Handle other types of responses if needed
+                chat_response = {
+                    'type': 'unknown',
+                    'content': 'Unsupported response type'
+                }
+            return jsonify({
+                'response': chat_response,
+                'total_tokens': self.mulebot.get_total_tokens()
+            })
+    def set_api_key(self, api_key):
+        self.mulebot = MuleBot(api_key)
+    def run(self, debug=False, host='0.0.0.0', port=5000):
+        if not self.mulebot:
+            raise ValueError("API key not set. Please call set_api_key() before running the server.")
         self.app.run(debug=debug, host=host, port=port)

datamule 0.381__py3-none-any.whl → 1.0.0__py3-none-any.whl

datamule 0.381__py3-none-any.whl → 1.0.0__py3-none-any.whl