itchfeed 1.0.0__py3-none-any.whl → 1.0.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
itch/parser.py CHANGED
@@ -1,180 +1,173 @@
1
- from queue import Queue
2
- from typing import BinaryIO, List
3
-
4
- from itch import messages as msg
5
- from itch.messages import MarketMessage
6
-
7
- class MessageParser(object):
8
- """
9
- A market message parser for ITCH 5.0 data.
10
-
11
- """
12
-
13
- def __init__(self, message_type: bytes = msg.MESSAGES):
14
- self.message_type = message_type
15
-
16
- def read_message_from_file(
17
- self,
18
- file: BinaryIO,
19
- cachesize: int = 4096,
20
- ) -> List[MarketMessage]:
21
- max_message_size = 52
22
- file_end_reached = False
23
-
24
- data_buffer = file.read(cachesize)
25
- buffer_len = len(data_buffer)
26
- messages: List[MarketMessage] = []
27
-
28
- while not file_end_reached:
29
- if buffer_len < 2:
30
- new_data = file.read(cachesize)
31
- if not new_data:
32
- break
33
- data_buffer += new_data
34
- buffer_len = len(data_buffer)
35
- continue
36
-
37
- if data_buffer[0:1] != b"\x00":
38
- raise ValueError(
39
- "Unexpected byte: " + str(data_buffer[0:1], encoding="ascii")
40
- )
41
-
42
- message_len = data_buffer[1]
43
- total_len = 2 + message_len
44
-
45
- if buffer_len < total_len:
46
- # Wait for more data if message is incomplete
47
- new_data = file.read(cachesize)
48
- if not new_data:
49
- break
50
- data_buffer += new_data
51
- buffer_len = len(data_buffer)
52
- continue
53
- message_data = data_buffer[2:total_len]
54
- message = self.get_message_type(message_data)
55
-
56
- if message.message_type in self.message_type:
57
- messages.append(message)
58
-
59
- if message.message_type == b"S": # System message
60
- if message.event_code == b"C": # End of messages
61
- break
62
-
63
- # Update buffer
64
- data_buffer = data_buffer[total_len:]
65
- buffer_len = len(data_buffer)
66
-
67
- if buffer_len < max_message_size and not file_end_reached:
68
- new_data = file.read(cachesize)
69
- if not new_data:
70
- file_end_reached = True
71
- else:
72
- data_buffer += new_data
73
- buffer_len = len(data_buffer)
74
-
75
- return messages
76
-
77
- def read_message_from_bytes(self, data: bytes):
78
- """
79
- Process one or multiple ITCH binary messages from a raw bytes input.
80
-
81
- Args:
82
- data (bytes): Binary blob containing one or more ITCH messages.
83
-
84
- Returns:
85
- Queue: A queue containing parsed ITCH message objects.
86
-
87
- Notes:
88
- - Each message must be prefixed with a 0x00 header and a length byte.
89
- - No buffering is done here — this is meant for real-time decoding.
90
- """
91
-
92
- offset = 0
93
- messages = Queue()
94
- while offset + 2 <= len(data):
95
- # Each message starts with: 1-byte header (0x00) 1-byte length
96
- if data[offset : offset + 1] != b"\x00":
97
- raise ValueError(
98
- f"Unexpected start byte at offset {offset}: "
99
- f"{str(data[offset : offset + 1], encoding='ascii')}"
100
- )
101
-
102
- msg_len = data[offset + 1]
103
- total_len = 2 + msg_len
104
-
105
- if offset + total_len > len(data):
106
- break
107
-
108
- raw_msg = data[offset + 2 : offset + total_len]
109
- message = self.get_message_type(raw_msg)
110
-
111
- if message.message_type in self.message_type:
112
- messages.put(message)
113
-
114
- if message.message_type == b"S": # System message
115
- if message.event_code == b"C": # End of messages
116
- break
117
-
118
- offset += total_len
119
-
120
- return messages
121
-
122
- def get_message_type(self, message: bytes):
123
- """
124
- Take an entire bytearray and return the appropriate ITCH message
125
- instance based on the message type indicator (first byte of the message).
126
-
127
- All message type indicators are single ASCII characters.
128
- """
129
- message_type = message[0:1]
130
- match message_type:
131
- case b"S":
132
- return msg.SystemEventMessage(message)
133
- case b"R":
134
- return msg.StockDirectoryMessage(message)
135
- case b"H":
136
- return msg.StockTradingActionMessage(message)
137
- case b"Y":
138
- return msg.RegSHOMessage(message)
139
- case b"L":
140
- return msg.MarketParticipantPositionMessage(message)
141
- case b"V":
142
- return msg.MWCBDeclineLeveMessage(message)
143
- case b"W":
144
- return msg.MWCBStatusMessage(message)
145
- case b"K":
146
- return msg.IPOQuotingPeriodUpdateMessage(message)
147
- case b"J":
148
- return msg.LULDAuctionCollarMessage(message)
149
- case b"h":
150
- return msg.OperationalHaltMessage(message)
151
- case b"A":
152
- return msg.AddOrderNoMPIAttributionMessage(message)
153
- case b"F":
154
- return msg.AddOrderMPIDAttribution(message)
155
- case b"E":
156
- return msg.OrderExecutedMessage(message)
157
- case b"C":
158
- return msg.OrderExecutedWithPriceMessage(message)
159
- case b"X":
160
- return msg.OrderCancelMessage(message)
161
- case b"D":
162
- return msg.OrderDeleteMessage(message)
163
- case b"U":
164
- return msg.OrderReplaceMessage(message)
165
- case b"P":
166
- return msg.NonCrossTradeMessage(message)
167
- case b"Q":
168
- return msg.CrossTradeMessage(message)
169
- case b"B":
170
- return msg.BrokenTradeMessage(message)
171
- case b"I":
172
- return msg.NOIIMessage(message)
173
- case b"N":
174
- return msg.RetailPriceImprovementIndicator(message)
175
- case b"O":
176
- return msg.DLCRMessage(message)
177
- case _:
178
- raise ValueError(
179
- f"Unknown message type: {message_type.decode(encoding='ascii')}"
180
- )
1
+ from queue import Queue
2
+ from typing import BinaryIO, List
3
+
4
+ from itch.messages import MESSAGES, MarketMessage
5
+ from itch.messages import messages as msgs
6
+
7
+
8
class MessageParser(object):
    """
    A market message parser for ITCH 5.0 data.

    Input is consumed as a sequence of frames: a 0x00 byte, a one-byte body
    length, then the body, whose first byte is the message type indicator.

    Attributes:
        message_type: Message type indicators to keep. A decoded message is
            returned only when its ``message_type`` is ``in`` this value.
    """

    def __init__(self, message_type: bytes = MESSAGES):
        self.message_type = message_type

    def read_message_from_file(
        self,
        file: BinaryIO,
        cachesize: int = 4096,
    ) -> List[MarketMessage]:
        """
        Read and decode every complete frame from a binary file-like object.

        Data is pulled from ``file`` in chunks of ``cachesize`` bytes. Decoding
        stops when the file is exhausted or right after a system message
        (``message_type == b"S"``) whose ``event_code`` is ``b"C"``. Complete
        frames that are already buffered when the file runs dry are still
        decoded; an incomplete trailing frame is ignored.

        Args:
            file (BinaryIO):
                A binary file-like object (opened in binary mode) from which
                market messages are read.
            cachesize (int, optional):
                The size (in bytes) of each chunk requested from the file.
                Defaults to 4096 bytes.

        Returns:
            List[MarketMessage]:
                The decoded messages whose type is in ``self.message_type``,
                in file order.

        Raises:
            ValueError:
                If a frame does not start with the expected 0x00 byte, or if
                the body cannot be turned into a message object.

        Message Format:
            - Each frame starts with a 0x00 byte.
            - The following byte specifies the body length.
            - The complete frame is those 2 bytes plus 'body length' bytes.

        Example:
            >>> parser = MessageParser()
            >>> with open('market_data.bin', 'rb') as binary_file:
            ...     messages = parser.read_message_from_file(binary_file)
            >>> for message in messages:
            ...     print(message)
        """
        messages: List[MarketMessage] = []
        data_buffer = file.read(cachesize)
        offset = 0  # start of the next undecoded frame inside data_buffer

        while True:
            if len(data_buffer) - offset >= 2:
                start_byte = data_buffer[offset : offset + 1]
                if start_byte != b"\x00":
                    # backslashreplace keeps the message readable for bytes
                    # >= 0x80 instead of failing inside the error path.
                    raise ValueError(
                        "Unexpected byte: "
                        + start_byte.decode("ascii", errors="backslashreplace")
                    )

                frame_end = offset + 2 + data_buffer[offset + 1]
                if frame_end <= len(data_buffer):
                    message = self.get_message_type(
                        data_buffer[offset + 2 : frame_end]
                    )

                    if message.message_type in self.message_type:
                        messages.append(message)

                    # System message with event code "C": end of messages.
                    if message.message_type == b"S" and message.event_code == b"C":
                        break

                    offset = frame_end
                    continue

            # Header or body incomplete: fetch more data. Only an empty read
            # ends the loop, so frames still in the buffer are never dropped.
            new_data = file.read(cachesize)
            if not new_data:
                break
            data_buffer = data_buffer[offset:] + new_data
            offset = 0

        return messages

    def read_message_from_bytes(self, data: bytes) -> Queue:
        """
        Process one or multiple ITCH binary messages from a raw bytes input.

        Args:
            data (bytes): Binary blob containing one or more ITCH messages.

        Returns:
            Queue: A queue containing the parsed ITCH message objects whose
            type is in ``self.message_type``.

        Raises:
            ValueError: If a frame does not start with a 0x00 byte, or if the
                body cannot be turned into a message object.

        Notes:
            - Each message must be prefixed with a 0x00 header and a length byte.
            - No buffering is done here; this is meant for real-time decoding,
              and an incomplete trailing frame is ignored.
            - Decoding stops after a system message with event code ``b"C"``.
        """
        messages = Queue()
        data_len = len(data)
        offset = 0

        while offset + 2 <= data_len:
            # Each message starts with: 1-byte header (0x00), 1-byte length.
            start_byte = data[offset : offset + 1]
            if start_byte != b"\x00":
                raise ValueError(
                    f"Unexpected start byte at offset {offset}: "
                    f"{start_byte.decode('ascii', errors='backslashreplace')}"
                )

            frame_end = offset + 2 + data[offset + 1]
            if frame_end > data_len:
                break

            message = self.get_message_type(data[offset + 2 : frame_end])

            if message.message_type in self.message_type:
                messages.put(message)

            # System message with event code "C": end of messages.
            if message.message_type == b"S" and message.event_code == b"C":
                break

            offset = frame_end

        return messages

    def get_message_type(self, message: bytes):
        """
        Build the ITCH message object matching the body's type indicator.

        The indicator is the first byte of ``message``. It is looked up in the
        ``msgs`` registry (assumed to be a mapping from indicator to message
        class - confirm against ``itch.messages``) and the whole body is
        passed to the class found there.

        Args:
            message: Message body without the two-byte frame header.

        Returns:
            An instance of the message class registered for the indicator.

        Raises:
            ValueError: If the indicator (or an empty body) is not registered,
                or if the message class fails to decode the body. In the
                latter case the original error is chained as ``__cause__``.
        """
        message_type = message[0:1]
        # Escape non-ASCII indicators so building the error text cannot itself
        # raise a UnicodeDecodeError.
        shown = message_type.decode("ascii", errors="backslashreplace")

        try:
            message_class = msgs[message_type]
        except KeyError:
            raise ValueError(f"Unknown message type: {shown}") from None

        try:
            return message_class(message)
        except Exception as exc:
            # Still a ValueError for existing callers, but no longer
            # misreported as an unknown type; the real cause stays attached.
            raise ValueError(
                f"Could not decode message of type {shown}: {exc}"
            ) from exc