@@ -26,6 +26,7 @@ def __init__(self, data_iter):
26
26
self .data_iter = data_iter
27
27
self .i = 0
28
28
self .chunk = b""
29
+ self .last_char = None
29
30
30
31
def read (self ):
31
32
"""Read the next character from the stream."""
@@ -39,16 +40,37 @@ def read(self):
39
40
self .i += 1
40
41
return char
41
42
42
- def fast_forward (self , closer ):
43
- """Read through the stream until the character is ``closer``, ``]``
43
+ def fast_forward (self , closer , * , return_object = False ):
44
+ """
45
+ Read through the stream until the character is ``closer``, ``]``
44
46
(ending a list) or ``}`` (ending an object.) Intermediate lists and
45
- objects are skipped."""
47
+ objects are skipped.
48
+
49
+ :param str closer: the character to read until
50
+ :param bool return_object: read until the closer,
51
+ and then parse the data and return as an object
52
+ """
53
+
46
54
closer = ord (closer )
47
55
close_stack = [closer ]
48
56
count = 0
57
+
58
+ buffer = None
59
+ if return_object :
60
+ buffer = bytearray (32 )
61
+ # ] = 93, [ = 91
62
+ # } = 125, { = 123
63
+ buffer [0 ] = closer - 2
64
+
49
65
while close_stack :
50
66
char = self .read ()
51
67
count += 1
68
+ if buffer :
69
+ if count == len (buffer ):
70
+ new_buffer = bytearray (len (buffer ) + 32 )
71
+ new_buffer [: len (buffer )] = buffer
72
+ buffer = new_buffer
73
+ buffer [count ] = char
52
74
if char == close_stack [- 1 ]:
53
75
close_stack .pop ()
54
76
elif char == ord ('"' ):
@@ -63,6 +85,9 @@ def fast_forward(self, closer):
63
85
close_stack .append (ord ("}" ))
64
86
elif char == ord ("[" ):
65
87
close_stack .append (ord ("]" ))
88
+ if buffer :
89
+ value_string = bytes (memoryview (buffer )[: count + 1 ]).decode ("utf-8" )
90
+ return json .loads (value_string )
66
91
return False
67
92
68
93
def next_value (self , endswith = None ):
@@ -77,10 +102,10 @@ def next_value(self, endswith=None):
77
102
except EOFError :
78
103
char = endswith
79
104
if not in_string and (char == endswith or char in (ord ("]" ), ord ("}" ))):
105
+ self .last_char = char
80
106
if len (buf ) == 0 :
81
107
return None
82
108
value_string = bytes (buf ).decode ("utf-8" )
83
- # print(f"{repr(value_string)}, {endswith=}")
84
109
return json .loads (value_string )
85
110
if char == ord ("{" ):
86
111
return TransientObject (self )
@@ -94,40 +119,56 @@ def next_value(self, endswith=None):
94
119
buf .append (char )
95
120
96
121
97
- class Transient : # pylint: disable=too-few-public-methods
122
+ class Transient :
98
123
"""Transient object representing a JSON object."""
99
124
100
- # This is helpful for checking that something is a TransientList or TransientObject.
101
-
102
-
103
- class TransientList (Transient ):
104
- """Transient object that acts like a list through the stream."""
105
-
106
125
def __init__ (self , stream ):
126
+ self .active_child = None
107
127
self .data = stream
108
128
self .done = False
109
- self .active_child = None
129
+ self .has_read = False
130
+ self .finish_char = ""
110
131
111
132
def finish (self ):
112
133
"""Consume all of the characters for this list from the stream."""
113
134
if not self .done :
114
135
if self .active_child :
115
136
self .active_child .finish ()
116
137
self .active_child = None
117
- self .data .fast_forward ("]" )
138
+ self .data .fast_forward (self .finish_char )
139
+ self .done = True
140
+
141
+ def as_object (self ):
142
+ """Consume all of the characters for this list from the stream and return as an object."""
143
+ if self .has_read :
144
+ raise BufferError ("Object has already been partly read." )
145
+
118
146
self .done = True
147
+ return self .data .fast_forward (self .finish_char , return_object = True )
148
+
149
+
150
+ class TransientList (Transient ):
151
+ """Transient object that acts like a list through the stream."""
152
+
153
+ def __init__ (self , stream ):
154
+ super ().__init__ (stream )
155
+ self .finish_char = "]"
119
156
120
157
def __iter__ (self ):
121
158
return self
122
159
123
160
def __next__ (self ):
161
+ self .has_read = True
162
+
124
163
if self .active_child :
125
164
self .active_child .finish ()
126
165
self .done = self .data .fast_forward ("," )
127
166
self .active_child = None
128
167
if self .done :
129
168
raise StopIteration ()
130
169
next_value = self .data .next_value ("," )
170
+ if self .data .last_char == ord ("]" ):
171
+ self .done = True
131
172
if next_value is None :
132
173
self .done = True
133
174
raise StopIteration ()
@@ -140,42 +181,39 @@ class TransientObject(Transient):
140
181
"""Transient object that acts like a dictionary through the stream."""
141
182
142
183
def __init__ (self , stream ):
143
- self . data = stream
144
- self .done = False
145
- self .buf = array . array ( "B" )
184
+ super (). __init__ ( stream )
185
+ self .finish_char = "}"
186
+ self .active_child_key = None
146
187
147
- self .active_child = None
188
+ def __getitem__ (self , key ):
189
+ if self .active_child and self .active_child_key == key :
190
+ return self .active_child
148
191
149
- def finish (self ):
150
- """Consume all of the characters for this object from the stream."""
151
- if not self .done :
152
- if self .active_child :
153
- self .active_child .finish ()
154
- self .active_child = None
155
- self .data .fast_forward ("}" )
156
- self .done = True
192
+ self .has_read = True
157
193
158
- def __getitem__ (self , key ):
159
194
if self .active_child :
160
195
self .active_child .finish ()
161
196
self .done = self .data .fast_forward ("," )
162
197
self .active_child = None
198
+ self .active_child_key = None
163
199
if self .done :
164
- raise KeyError ()
200
+ raise KeyError (key )
165
201
166
- while True :
202
+ while not self . done :
167
203
current_key = self .data .next_value (":" )
168
204
if current_key is None :
169
- # print("object done", self)
170
205
self .done = True
171
206
break
172
207
if current_key == key :
173
208
next_value = self .data .next_value ("," )
209
+ if self .data .last_char == ord ("}" ):
210
+ self .done = True
174
211
if isinstance (next_value , Transient ):
175
212
self .active_child = next_value
213
+ self .active_child_key = key
176
214
return next_value
177
- self .data .fast_forward ("," )
178
- raise KeyError ()
215
+ self .done = self . data .fast_forward ("," )
216
+ raise KeyError (key )
179
217
180
218
181
219
def load (data_iter ):
0 commit comments