Skip to content

Commit c65dbb4

Browse files
authored
Merge pull request #3381 from westfish/uie_reader_memory_overflow
fix uie dataloader memory overflow
2 parents db1f991 + 4c4f961 commit c65dbb4

File tree

1 file changed

+6
-1
lines changed

1 file changed

+6
-1
lines changed

model_zoo/uie/utils.py

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -222,6 +222,10 @@ def reader(data_path, max_seq_len=512):
222 222
if len(content) <= max_content_len:
223 223
yield json_line
224 224
else:
225+
if result['end'] - result['start'] > max_content_len:
226+
logger.warn(
227+
"result['end '] - result ['start'] exceeds max_content_len, which will result in no valid instance being returned"
228+
)
225 229
result_list = json_line['result_list']
226 230
json_lines = []
227 231
accumulate = 0
@@ -230,7 +234,8 @@ def reader(data_path, max_seq_len=512):
230 234

231 235
for result in result_list:
232 236
if result['start'] + 1 <= max_content_len < result[
233-
'end']:
237+
'end'] and result['end'] - result[
238+
'start'] <= max_content_len:
234 239
max_content_len = result['start']
235 240
break
236 241

0 commit comments

Comments
 (0)