In [5]:
import os
import sys
import cv2
import json
import shutil
from glob import glob
from tqdm import tqdm
from pathlib import Path

from utils.table2label import table2layout, fuse_gt_info, judge_error
from utils.table_helper import correct_table



def table2label(table_dir, label_dir, error_file_path):
    """Convert every table annotation JSON in ``table_dir`` into a ground-truth label file.

    Each ``*.json`` file is processed in sorted path order: it is loaded,
    converted with ``table2layout``, enriched with ``fuse_gt_info`` and then
    checked with ``judge_error``. Tables that pass are written to
    ``{label_dir}/{json_id}-gt.json``, where ``json_id`` is the file name up to
    its first dot. Tables that fail are skipped and recorded in the error
    report instead.

    Args:
        table_dir: Directory containing the source ``*.json`` table files.
        label_dir: Directory that receives the ``*-gt.json`` label files.
            It is created if it does not exist yet.
        error_file_path: Path of the JSON report that maps each failed file
            name to its error message.

    Returns:
        None. Results are written to disk and the number of failed tables is
        printed.
    """
    # Make the function usable on its own; an empty string means "current directory".
    if label_dir:
        os.makedirs(label_dir, exist_ok=True)

    table_error = {}
    json_files = sorted(glob(os.path.join(table_dir, '*.json')))
    for json_path in tqdm(json_files, total=len(json_files)):
        json_name = os.path.basename(json_path)
        json_id = json_name.split('.')[0]

        # Context managers guarantee the handle is closed even with thousands of files.
        with open(json_path, 'r', encoding='utf-8') as table_file:
            table = json.load(table_file)

        try:
            gt_label = table2layout(table)
        except Exception:
            # Catch only ordinary errors so Ctrl-C / SystemExit can still abort the run.
            table_error[json_name] = 'table2layout error'
            continue

        # Original author's note: for wired (bordered) tables the bbox obtained
        # here is still the cell box, not the text box.
        gt_label = fuse_gt_info(gt_label, table)

        valid, msg = judge_error(table, gt_label)
        if not valid:
            print(json_name, msg)
            table_error[json_name] = msg
            continue

        gt_json_path = os.path.join(label_dir, f'{json_id}-gt.json')
        with open(gt_json_path, 'w', encoding='utf-8') as gt_file:
            json.dump(gt_label, gt_file, indent=4)

    with open(error_file_path, 'w', encoding='utf-8') as error_file:
        json.dump(table_error, error_file, indent=4)

    print('table error: {}'.format(len(table_error)))

## STEP.1 gen_gt_labels

In [6]:
# STEP 1: generate ground-truth labels for one dataset split.
#
# Input
#     Table annotation directory: {DATASET_ROOT}/{DATASET}
# Output
#     Ground-truth label directory: {DATASET_ROOT}/{DATASET}_gt_json/
#     Error report:                 {DATASET_ROOT}/{DATASET}_error.json
#
# Error counts noted by the original author for the training set
# (NOTE(review): which dataset variant these refer to is not recorded here):
#     before using fix_gt_table: 684
#     after using fix_gt_table:  665
#         + after removing data with area == 0: 664
DATASET = "train_jpg480max"
# Machine-specific default; set TABLESTRUCT_DATA_ROOT to run on another
# machine without editing the notebook.
DATASET_ROOT = os.environ.get(
    'TABLESTRUCT_DATA_ROOT', '/media/ubuntu/Date12/TableStruct/new_data'
)

TABLE_DIR = os.path.join(DATASET_ROOT, DATASET)
LABEL_DIR = os.path.join(DATASET_ROOT, f'{DATASET}_gt_json')
TABLE_ERROR_PATH = os.path.join(DATASET_ROOT, f'{DATASET}_error.json')

# Fail before touching LABEL_DIR: with a wrong input path the run would
# otherwise delete the previous labels and silently produce an empty result.
if not os.path.isdir(TABLE_DIR):
    raise FileNotFoundError(f'table directory not found: {TABLE_DIR}')

# Start from an empty label directory so stale labels from earlier runs
# cannot survive.
if os.path.exists(LABEL_DIR):
    shutil.rmtree(LABEL_DIR)
Path(LABEL_DIR).mkdir(parents=True)

table2label(TABLE_DIR, LABEL_DIR, TABLE_ERROR_PATH)


  0%|          | 35/12104 [00:01<09:39, 20.84it/s]

00029.json line idx:[[6], [12], [113]] not find


  0%|          | 60/12104 [00:02<09:40, 20.74it/s]

00057.json line idx:[[34]] not find


  1%|          | 90/12104 [00:04<05:58, 33.53it/s]

00084.json line idx:[[20], [61], [62], [103], [104]] not find


  1%|▏         | 174/12104 [00:05<03:03, 65.10it/s]

00169.json line idx:[[0], [2], [9], [10], [16], [17]] not find


  2%|▏         | 258/12104 [00:07<03:45, 52.46it/s]

00250.json line idx:[[6]] not find


  2%|▏         | 285/12104 [00:07<03:22, 58.29it/s]

00273.json line idx:[[2], [8]] not find
00280.json line idx:[[35]] not find


  3%|▎         | 316/12104 [00:08<03:03, 64.29it/s]

00301.json line idx:[[17], [18], [20]] not find
00303.json line idx:[[9], [17], [18]] not find
00307.json line idx:[[4], [18], [20]] not find
00314.json line idx:[[32], [35]] not find


  3%|▎         | 330/12104 [00:08<03:32, 55.51it/s]

00325.json line idx:[[19], [20]] not find


  3%|▎         | 341/12104 [00:08<05:04, 38.66it/s]

00334.json line idx:[[0], [1], [2], [3]] not find


  3%|▎         | 354/12104 [00:09<06:12, 31.57it/s]

00353.json line idx:[[13], [23], [47], [48], [49], [50], [72], [73], [74], [75]] not find


  3%|▎         | 365/12104 [00:09<06:12, 31.50it/s]

00358.json line idx:[[0], [13], [18], [23]] not find


  3%|▎         | 394/12104 [00:10<02:51, 68.42it/s]

00374.json line idx:[[18]] not find


  4%|▍         | 493/12104 [00:13<15:29, 12.50it/s] 

00489.json line idx:[[26], [27], [36], [37]] not find


  5%|▍         | 586/12104 [00:15<02:48, 68.35it/s]

00573.json line idx:[[0], [2]] not find


  5%|▍         | 596/12104 [00:15<02:41, 71.16it/s]

00600.json line idx:[[0], [1], [35], [36]] not find
00602.json line idx:[[4], [11], [12]] not find


  5%|▌         | 619/12104 [00:16<03:34, 53.44it/s]

00611.json line idx:[[3]] not find


  5%|▌         | 646/12104 [00:17<04:39, 40.94it/s]

00641.json line idx:[[13], [14], [15], [16]] not find


  6%|▌         | 678/12104 [00:17<03:43, 51.17it/s]

00668.json line idx:[[4], [6]] not find
00674.json line idx:[[34]] not find


  6%|▌         | 739/12104 [00:19<03:56, 48.09it/s]

00731.json line idx:[[0], [1], [2], [3]] not find
00741.json line idx:[[14], [33], [34], [49]] not find


  6%|▌         | 750/12104 [00:19<04:26, 42.53it/s]

00745.json line idx:[[24]] not find


  6%|▋         | 767/12104 [00:19<05:22, 35.12it/s]

00759.json line idx:[[102]] not find


  6%|▋         | 779/12104 [00:20<06:11, 30.49it/s]

00773.json line idx:[[39]] not find


  7%|▋         | 788/12104 [00:20<07:12, 26.16it/s]

00782.json line idx:[[111], [127]] not find


  7%|▋         | 901/12104 [00:22<03:45, 49.77it/s] 

00902.json line idx:[[0], [1], [2], [3], [7], [8], [9], [10], [11], [12], [13], [14]] not find


  9%|▉         | 1127/12104 [00:28<02:50, 64.30it/s]

01119.json line idx:[[5], [40]] not find


  9%|▉         | 1134/12104 [00:28<03:07, 58.54it/s]

01131.json line idx:[[11], [61]] not find
01136.json line idx:[[87]] not find


  9%|▉         | 1141/12104 [00:29<03:55, 46.59it/s]

01138.json line idx:[[16], [19], [40], [41]] not find


 10%|▉         | 1203/12104 [00:30<03:25, 52.95it/s]

01203.json line idx:[[28], [31]] not find


 11%|█▏        | 1363/12104 [00:34<07:22, 24.25it/s]

01361.json line idx:[[0], [4], [5], [6]] not find


 11%|█▏        | 1386/12104 [00:35<06:19, 28.21it/s]

01378.json line idx:[[63], [64]] not find


 12%|█▏        | 1480/12104 [00:36<02:30, 70.61it/s]

01475.json line idx:[[9]] not find


 12%|█▏        | 1509/12104 [00:37<03:29, 50.46it/s]

01498.json line idx:[[0]] not find
01499.json line idx:[[37]] not find


 13%|█▎        | 1602/12104 [00:39<02:41, 64.83it/s]

01586.json line idx:[[6], [7], [8], [9], [10], [14], [15], [16], [17], [18], [21], [22], [23], [24], [25], [26], [31], [32]] not find


 14%|█▍        | 1681/12104 [00:41<03:51, 45.06it/s]

01668.json line idx:[[57], [73], [114]] not find


 15%|█▍        | 1764/12104 [00:42<02:23, 72.19it/s] 

01768.json line idx:[[84], [88]] not find


 15%|█▍        | 1800/12104 [00:44<10:57, 15.68it/s]

01797.json line idx:[[137], [198]] not find


 16%|█▌        | 1961/12104 [00:48<02:36, 64.70it/s]

01947.json line idx:[[83], [84], [85], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95]] not find
01948.json line idx:[[12]] not find


 16%|█▋        | 1992/12104 [00:49<02:57, 57.13it/s]

01990.json line idx:[[0]] not find


 17%|█▋        | 2004/12104 [00:50<05:26, 30.96it/s]

01997.json line idx:[[0], [1], [2], [3]] not find


 17%|█▋        | 2075/12104 [00:51<03:03, 54.59it/s]

02065.json line idx:[[25], [26], [27], [29], [30], [31], [32], [33], [38]] not find
02077.json line idx:[[0]] not find


 18%|█▊        | 2146/12104 [00:53<02:44, 60.71it/s]

02125.json line idx:[[16], [18], [19]] not find


 18%|█▊        | 2215/12104 [00:54<03:55, 41.98it/s] 

02209.json line idx:[[2], [3]] not find


 18%|█▊        | 2229/12104 [00:55<03:50, 42.93it/s]

02223.json line idx:[[1]] not find


 19%|█▉        | 2296/12104 [00:56<02:55, 55.74it/s]

02284.json line idx:[[26]] not find


 19%|█▉        | 2316/12104 [00:56<04:36, 35.44it/s]

02315.json line idx:[[67], [68], [69], [70], [127], [128]] not find


 20%|██        | 2471/12104 [00:59<02:22, 67.38it/s]

02465.json line idx:[[101]] not find


 21%|██        | 2489/12104 [00:59<02:16, 70.47it/s]

02478.json line idx:[[16]] not find
02489.json line idx:[[6], [32]] not find


 21%|██        | 2559/12104 [01:01<01:51, 85.71it/s]

02561.json line idx:[[224], [225], [226], [227], [228]] not find
02565.json line idx:[[1], [2], [3], [5], [7], [9]] not find


 21%|██        | 2569/12104 [01:01<04:09, 38.18it/s]

02569.json line idx:[[0], [1]] not find


 21%|██▏       | 2577/12104 [01:02<06:53, 23.03it/s]

02572.json line idx:[[0], [1], [2], [3], [4], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30]] not find
02575.json line idx:[[6], [8]] not find


 21%|██▏       | 2589/12104 [01:02<05:29, 28.91it/s]

02584.json line idx:[[19]] not find


 22%|██▏       | 2627/12104 [01:03<02:58, 52.98it/s]

02619.json line idx:[[56], [57]] not find


 22%|██▏       | 2660/12104 [01:04<03:53, 40.47it/s]

02655.json line idx:[[41], [42]] not find


 22%|██▏       | 2665/12104 [01:04<04:50, 32.47it/s]

02663.json line idx:[[18], [19], [20], [22], [23], [24], [25]] not find


 25%|██▍       | 2977/12104 [01:08<03:19, 45.69it/s] 

02967.json line idx:[[2], [6]] not find


 25%|██▍       | 3014/12104 [01:09<03:13, 47.10it/s]

03007.json line idx:[[5], [6], [7], [8]] not find


 25%|██▌       | 3049/12104 [01:10<03:56, 38.27it/s]

03051.json line idx:[[56], [62], [68]] not find


 25%|██▌       | 3062/12104 [01:11<05:46, 26.07it/s]

03056.json layout error: cell_idx: 0, row_span: [0, 12], col_span: [0, 9]


 25%|██▌       | 3074/12104 [01:11<05:25, 27.78it/s]

03068.json line idx:[[2], [3], [4]] not find


 26%|██▌       | 3151/12104 [01:12<02:16, 65.49it/s]

03141.json line idx:[[5], [9], [10]] not find


 27%|██▋       | 3299/12104 [01:15<04:35, 31.97it/s]

03296.json line idx:[[87]] not find


 28%|██▊       | 3408/12104 [01:17<02:07, 68.10it/s]

03395.json line idx:[[24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [40], [41]] not find


 31%|███       | 3773/12104 [01:23<02:33, 54.42it/s] 

03766.json line idx:[[32], [33], [34]] not find


 33%|███▎      | 3969/12104 [01:27<02:32, 53.43it/s]

03952.json line idx:[[38], [40], [41], [47], [55], [73], [166], [180], [184]] not find
03956.json line idx:[[67], [68], [69]] not find


 33%|███▎      | 4032/12104 [01:29<03:42, 36.26it/s]

04023.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7]] not find
04024.json line idx:[[37]] not find


 33%|███▎      | 4043/12104 [01:30<03:41, 36.33it/s]

04037.json line idx:[[24], [48], [49]] not find
04043.json line idx:[[30], [32], [39], [40]] not find


 34%|███▎      | 4071/12104 [01:30<02:30, 53.25it/s]

04067.json line idx:[[3]] not find


 34%|███▍      | 4090/12104 [01:30<02:40, 49.85it/s]

04081.json line idx:[[14]] not find


 36%|███▋      | 4408/12104 [01:35<02:12, 58.09it/s]

04399.json line idx:[[5], [18]] not find
04400.json line idx:[[21], [24], [25], [26], [27], [28], [29], [30], [35]] not find


 37%|███▋      | 4503/12104 [01:37<02:09, 58.87it/s]

04493.json line idx:[[0]] not find
04503.json layout error: cell_idx: 5, row_span: [1, 6], col_span: [0, 5]


 38%|███▊      | 4539/12104 [01:38<03:04, 41.02it/s]

04533.json line idx:[[70], [90]] not find


 39%|███▊      | 4669/12104 [01:40<02:30, 49.38it/s]

04668.json layout error: cell_idx: 2, row_span: [0, 2], col_span: [6, 9]


 39%|███▉      | 4705/12104 [01:41<02:30, 49.04it/s]

04701.json line idx:[[9], [10]] not find
04705.json line idx:[[0], [1]] not find


 39%|███▉      | 4756/12104 [01:42<01:54, 64.29it/s]

04753.json line idx:[[14]] not find
04755.json line idx:[[51], [52], [53], [54], [55], [56], [57], [58], [59]] not find


 40%|███▉      | 4787/12104 [01:43<02:13, 54.95it/s]

04778.json line idx:[[6], [8]] not find


 40%|███▉      | 4801/12104 [01:43<02:24, 50.55it/s]

04789.json layout error: cell_idx: 9, row_span: [0, 1], col_span: [9, 12]


 40%|███▉      | 4830/12104 [01:44<03:15, 37.27it/s]

04822.json line idx:[[0]] not find
04826.json line idx:[[47]] not find
04828.json line idx:[[0], [1]] not find


 40%|███▉      | 4840/12104 [01:44<03:15, 37.22it/s]

04835.json line idx:[[12]] not find


 40%|████      | 4856/12104 [01:45<03:48, 31.77it/s]

04849.json line idx:[[185]] not find


 42%|████▏     | 5047/12104 [01:47<01:34, 74.41it/s]

05027.json line idx:[[4], [9], [10], [11], [25], [26], [27], [28], [40], [41], [42], [43], [63], [64], [65], [66], [67], [68], [69], [72]] not find


 43%|████▎     | 5252/12104 [01:51<03:54, 29.25it/s]

05250.json line idx:[[5]] not find


 45%|████▌     | 5467/12104 [01:55<01:53, 58.39it/s]

05456.json line idx:[[23]] not find


 45%|████▌     | 5498/12104 [01:56<01:42, 64.47it/s]

05491.json line idx:[[1], [4]] not find
05494.json line idx:[[1], [2], [3], [4], [5], [6], [7], [11], [12], [16], [17], [18], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [39]] not find
05495.json line idx:[[1]] not find


 45%|████▌     | 5506/12104 [01:56<02:30, 43.75it/s]

05500.json line idx:[[1], [4], [5], [6], [7], [8], [9], [10], [44], [46], [47], [48], [49]] not find


 46%|████▌     | 5548/12104 [01:57<02:04, 52.82it/s]

05539.json line idx:[[2], [36], [37], [38], [61], [105], [106], [107], [108], [127], [128], [129]] not find
05540.json line idx:[[2], [133], [134]] not find
05547.json line idx:[[2], [3]] not find


 46%|████▌     | 5576/12104 [01:57<02:44, 39.61it/s]

05568.json line idx:[[24]] not find


 46%|████▋     | 5605/12104 [01:58<03:20, 32.35it/s]

05600.json line idx:[[45]] not find


 48%|████▊     | 5788/12104 [02:01<00:52, 120.27it/s]

05769.json line idx:[[5], [8], [10], [19], [24], [27]] not find


 50%|████▉     | 5997/12104 [02:04<02:12, 45.92it/s] 

05993.json line idx:[[1]] not find


 50%|████▉     | 6028/12104 [02:05<02:10, 46.72it/s]

06020.json line idx:[[0], [1], [6], [9], [10], [104]] not find


 50%|████▉     | 6042/12104 [02:05<02:02, 49.60it/s]

06035.json line idx:[[40], [42], [43], [44], [57]] not find


 50%|█████     | 6053/12104 [02:06<02:34, 39.29it/s]

06048.json line idx:[[0], [1], [4], [8], [13], [96], [97], [111], [112], [113], [114]] not find


 50%|█████     | 6079/12104 [02:07<03:40, 27.29it/s]

06077.json line idx:[[157]] not find
06079.json line idx:[[7], [8], [12], [15], [16], [17], [20], [23], [24], [25], [26], [27], [32], [34], [36], [37], [43], [44], [45], [46], [48], [50], [51], [103]] not find


 50%|█████     | 6109/12104 [02:08<02:26, 40.84it/s]

06098.json line idx:[[1], [7], [8], [11]] not find


 51%|█████     | 6128/12104 [02:08<01:59, 50.12it/s]

06120.json line idx:[[3], [4], [5]] not find


 51%|█████     | 6152/12104 [02:08<02:03, 48.36it/s]

06142.json line idx:[[0], [1], [2], [3], [4], [5]] not find


 51%|█████     | 6183/12104 [02:09<01:49, 54.11it/s]

06175.json line idx:[[2], [9]] not find


 51%|█████     | 6199/12104 [02:09<02:24, 40.85it/s]

06193.json line idx:[[5], [80]] not find


 52%|█████▏    | 6278/12104 [02:12<01:45, 55.33it/s]

06267.json line idx:[[4], [5]] not find


 52%|█████▏    | 6295/12104 [02:12<02:35, 37.31it/s]

06287.json line idx:[[19], [21], [23], [24], [25]] not find


 52%|█████▏    | 6321/12104 [02:13<02:35, 37.15it/s]

06316.json line idx:[[5], [6], [17]] not find


 53%|█████▎    | 6363/12104 [02:14<02:48, 34.13it/s]

06360.json line idx:[[19], [81]] not find


 53%|█████▎    | 6373/12104 [02:14<03:12, 29.75it/s]

06365.json line idx:[[46], [48], [52], [53]] not find


 54%|█████▍    | 6545/12104 [02:19<02:29, 37.08it/s]

06543.json line idx:[[6], [8]] not find


 54%|█████▍    | 6589/12104 [02:20<02:58, 30.96it/s]

06584.json line idx:[[15]] not find


 55%|█████▍    | 6639/12104 [02:21<02:35, 35.15it/s]

06632.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31]] not find


 55%|█████▌    | 6666/12104 [02:22<02:55, 31.00it/s]

06660.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15]] not find


 55%|█████▌    | 6715/12104 [02:25<03:39, 24.52it/s]

06707.json line idx:[[140], [141], [142], [143], [144], [145], [146], [147], [148], [149], [150], [151], [152]] not find
06716.json line idx:[[0], [1], [2]] not find
06717.json line idx:[[42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62]] not find


 56%|█████▌    | 6719/12104 [02:25<03:13, 27.84it/s]

06719.json line idx:[[0], [1], [2], [3], [4], [54]] not find


 56%|█████▌    | 6744/12104 [02:26<03:10, 28.16it/s]

06739.json line idx:[[20], [21], [85], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95]] not find
06743.json line idx:[[4], [5], [6], [7], [8], [9], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95], [96], [97], [98], [99], [100], [101], [102], [103], [104], [105], [106], [107], [108], [109], [110], [111], [112], [113], [114], [115], [116], [117], [118], [119], [120], [121], [122], [123], [124], [125], [126], [127], [128], [129], [130], [131], [132]] not find


 56%|█████▌    | 6771/12104 [02:27<02:15, 39.39it/s]

06769.json line idx:[[0], [1], [2], [3], [4], [5]] not find


 56%|█████▌    | 6789/12104 [02:28<04:06, 21.60it/s]

06782.json line idx:[[42]] not find


 56%|█████▌    | 6797/12104 [02:29<03:42, 23.81it/s]

06791.json line idx:[[1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50]] not find
06794.json line idx:[[0], [1], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46]] not find


 56%|█████▋    | 6821/12104 [02:29<02:20, 37.71it/s]

06820.json line idx:[[21], [22], [23], [27], [28], [29], [30], [31], [32], [33], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67]] not find


 57%|█████▋    | 6909/12104 [02:32<02:41, 32.26it/s]

06907.json line idx:[[0], [5], [13], [14]] not find


 57%|█████▋    | 6947/12104 [02:34<02:41, 32.00it/s]

06942.json line idx:[[89]] not find


 58%|█████▊    | 6965/12104 [02:35<03:11, 26.82it/s]

06960.json line idx:[[0]] not find
06964.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19]] not find


 58%|█████▊    | 6977/12104 [02:35<02:55, 29.17it/s]

06971.json line idx:[[7], [8], [9], [10], [11], [14], [15], [16], [17], [18]] not find


 58%|█████▊    | 6989/12104 [02:35<02:45, 30.93it/s]

06984.json line idx:[[17], [18], [80], [85], [86], [87], [88]] not find
06989.json line idx:[[1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11]] not find


 58%|█████▊    | 7012/12104 [02:36<02:58, 28.50it/s]

07003.json line idx:[[119]] not find


 58%|█████▊    | 7038/12104 [02:37<02:44, 30.75it/s]

07033.json line idx:[[71]] not find


 59%|█████▊    | 7087/12104 [02:39<02:36, 32.11it/s]

07080.json line idx:[[27]] not find


 59%|█████▉    | 7150/12104 [02:42<03:19, 24.79it/s]

07143.json line idx:[[21], [38], [58], [68]] not find


 59%|█████▉    | 7167/12104 [02:43<03:02, 27.02it/s]

07164.json line idx:[[0]] not find
07166.json line idx:[[22]] not find
07167.json line idx:[[0], [54]] not find


 59%|█████▉    | 7183/12104 [02:43<02:51, 28.71it/s]

07179.json line idx:[[1], [3], [4], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [43], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [80], [81], [82], [86], [87], [88], [96], [97], [98], [105], [106], [107], [108], [109], [110], [117], [118], [119], [120], [121], [122], [126], [127], [128], [129], [130], [131], [136], [137], [142], [143]] not find


 59%|█████▉    | 7199/12104 [02:44<02:04, 39.35it/s]

07187.json line idx:[[0], [1], [2], [3], [4], [5], [7], [8], [10], [12], [13], [14], [15], [16], [17], [19], [20], [21], [22], [23], [24], [26], [27], [28], [29], [30], [31], [32], [34], [35], [36], [37], [38], [40], [41], [42], [43], [44], [45], [47], [48], [49], [50], [51], [52], [54], [55], [56], [57], [58], [60], [61], [62], [63], [64], [65], [67], [68], [69], [70], [71], [72], [74], [75], [76], [77], [80], [81], [82], [83], [84], [85], [86], [88], [89], [90], [91], [92], [93], [95], [96], [97], [98], [99], [100], [102], [103], [104], [105], [106], [107], [109], [110], [111], [112], [113], [115], [116], [117], [118], [119], [120], [122], [123], [124], [125], [126], [128], [129], [130], [131], [132]] not find


 60%|█████▉    | 7211/12104 [02:44<01:41, 48.35it/s]

07208.json line idx:[[5]] not find


 60%|██████    | 7276/12104 [02:47<04:00, 20.08it/s]

07271.json line idx:[[0], [1], [2], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95], [96]] not find


 61%|██████    | 7353/12104 [02:50<02:14, 35.41it/s]

07345.json line idx:[[22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37]] not find


 61%|██████    | 7367/12104 [02:51<02:44, 28.83it/s]

07367.json line idx:[[101]] not find


 61%|██████    | 7393/12104 [02:52<02:56, 26.72it/s]

07387.json line idx:[[8], [9], [10], [11], [12], [13], [14], [15], [16], [25], [26], [35], [36], [45], [50], [59], [64], [73], [76]] not find
07391.json line idx:[[0]] not find


 62%|██████▏   | 7472/12104 [02:54<02:11, 35.35it/s]

07474.json line idx:[[17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95], [96], [97], [98], [99], [100], [101], [102], [103], [104], [105], [106], [107], [108], [109], [110], [111], [112], [113], [114], [115], [116], [117], [118], [119], [120], [121], [122], [123], [124], [125], [126], [127], [128], [129]] not find


 62%|██████▏   | 7496/12104 [02:56<04:13, 18.19it/s]

07494.json line idx:[[54]] not find


 62%|██████▏   | 7505/12104 [02:56<04:53, 15.65it/s]

07503.json line idx:[[0]] not find


 62%|██████▏   | 7537/12104 [02:57<01:56, 39.09it/s]

07533.json layout error: cell_idx: 5, row_span: [2, 8], col_span: [0, 4]


 63%|██████▎   | 7572/12104 [02:58<01:36, 46.78it/s]

07564.json line idx:[[0], [1], [2], [3]] not find


 63%|██████▎   | 7578/12104 [02:58<01:38, 45.74it/s]

07576.json line idx:[[164]] not find
07577.json line idx:[[89]] not find


 63%|██████▎   | 7596/12104 [02:59<02:43, 27.61it/s]

07593.json line idx:[[23]] not find


 63%|██████▎   | 7635/12104 [03:01<03:15, 22.83it/s]

07633.json line idx:[[0], [1], [2], [4], [5], [6], [7], [8], [9], [11], [12], [13], [14], [15], [16], [17], [19], [20], [21], [22], [23], [24], [26], [27], [28], [29], [30], [31], [33], [34], [35], [36], [37], [38], [39], [40], [42], [43], [44], [45], [46], [47], [49], [50], [51], [52], [53], [54], [55], [56], [58], [59], [60], [61], [62], [63], [65], [66], [67], [68], [69], [70], [71], [72], [74], [75], [76], [77], [78], [79], [81], [82], [83], [84], [85], [86], [87], [88], [89], [91], [92], [93], [94], [95], [97], [98], [99], [100], [101], [102], [104], [105], [106], [107], [108], [110], [111], [112], [113], [114], [115], [116], [117], [118], [120], [121], [122], [123], [124], [125], [127], [128], [129], [130], [131], [132], [133], [134], [136], [137], [138], [139], [140], [142], [143], [144], [145], [146], [147], [148], [150], [151], [152], [153], [154], [155], [156], [157], [158]] not find


 63%|██████▎   | 7645/12104 [03:01<02:53, 25.66it/s]

07642.json line idx:[[0]] not find


 63%|██████▎   | 7654/12104 [03:02<02:05, 35.49it/s]

07655.json line idx:[[29], [30], [31], [32], [33], [34], [35]] not find


 64%|██████▎   | 7700/12104 [03:03<02:55, 25.09it/s]

07697.json line idx:[[62], [63]] not find


 64%|██████▎   | 7711/12104 [03:04<02:57, 24.78it/s]

07709.json line idx:[[57], [128]] not find
07711.json line idx:[[0], [2], [17], [22], [27], [47], [52], [59], [63], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85]] not find


 64%|██████▍   | 7717/12104 [03:04<03:59, 18.32it/s]

07713.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58]] not find
07717.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [13], [14], [15], [16]] not find


 64%|██████▍   | 7723/12104 [03:04<03:00, 24.29it/s]

07719.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73]] not find
07721.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8]] not find
07722.json line idx:[[0], [1], [2], [3], [44], [55], [66], [72], [88], [89]] not find


 64%|██████▍   | 7745/12104 [03:05<03:03, 23.73it/s]

07738.json line idx:[[43]] not find
07743.json line idx:[[70]] not find


 64%|██████▍   | 7778/12104 [03:06<01:39, 43.28it/s]

07767.json line idx:[[41], [42]] not find


 64%|██████▍   | 7806/12104 [03:07<02:19, 30.80it/s]

07805.json line idx:[[185], [187], [189], [191]] not find


 65%|██████▍   | 7828/12104 [03:08<02:08, 33.18it/s]

07823.json line idx:[[0], [1], [2], [113], [114], [115], [116], [117], [118], [119], [120], [121], [122]] not find
07827.json line idx:[[62]] not find


 65%|██████▍   | 7841/12104 [03:08<02:42, 26.30it/s]

07835.json line idx:[[0], [11], [12], [18], [24], [35], [36]] not find


 65%|██████▌   | 7904/12104 [03:10<02:07, 32.84it/s]

07903.json line idx:[[120]] not find


 66%|██████▌   | 7934/12104 [03:11<02:15, 30.70it/s]

07930.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79]] not find
07932.json line idx:[[0], [1], [2], [3], [4], [5]] not find


 66%|██████▌   | 7948/12104 [03:12<02:05, 33.01it/s]

07941.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [14], [15], [16], [17], [23], [24], [25], [26], [27], [28], [29], [30], [35], [36], [37], [38]] not find


 66%|██████▌   | 7956/12104 [03:12<02:20, 29.52it/s]

07951.json line idx:[[0], [5], [8], [9], [10], [11], [12], [15], [16], [17], [18], [20], [23], [24], [25], [28], [30], [31], [32], [35], [37], [38], [39], [42], [44], [45], [46], [49], [51], [52], [53], [56], [58], [59], [60], [62], [65], [66], [67], [70], [72], [73], [74], [77], [79], [80], [82], [85], [87], [89], [91], [92], [96], [97], [99], [101], [103], [104], [107], [109], [113], [115], [117], [122], [124], [125], [126], [127], [129], [131], [132], [133], [134], [138], [139], [140], [143], [145], [147], [148], [151], [152], [153], [157], [158], [159], [165], [166], [167], [170], [171], [172], [173], [174], [175], [176], [177], [178], [179], [180], [181], [182], [183]] not find


 66%|██████▌   | 7966/12104 [03:12<01:58, 34.93it/s]

07962.json line idx:[[1], [2], [3]] not find
07969.json line idx:[[0], [1], [3], [17], [23], [29], [35]] not find


 66%|██████▌   | 7987/12104 [03:13<03:23, 20.27it/s]

07985.json line idx:[[69]] not find


 66%|██████▋   | 8048/12104 [03:15<03:11, 21.21it/s]

08046.json line idx:[[43], [44], [70], [71], [72], [124], [125], [126]] not find


 67%|██████▋   | 8059/12104 [03:16<02:50, 23.66it/s]

08056.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7]] not find
08058.json line idx:[[149]] not find


 67%|██████▋   | 8079/12104 [03:16<02:05, 32.06it/s]

08069.json line idx:[[0], [1], [2], [3], [4], [15], [16], [17]] not find
08073.json line idx:[[44]] not find


 67%|██████▋   | 8094/12104 [03:17<02:42, 24.70it/s]

08088.json line idx:[[122], [123]] not find


 67%|██████▋   | 8130/12104 [03:18<01:27, 45.60it/s]

08118.json line idx:[[16]] not find


 67%|██████▋   | 8136/12104 [03:18<01:56, 34.15it/s]

08135.json line idx:[[68]] not find


 67%|██████▋   | 8156/12104 [03:19<02:37, 25.13it/s]

08152.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95], [96], [97], [98], [99], [100], [101], [102], [103]] not find
08153.json line idx:[[27], [32]] not find


 68%|██████▊   | 8194/12104 [03:21<01:46, 36.81it/s]

08184.json line idx:[[3], [6], [8], [13], [15], [18], [21], [23], [26], [28], [30], [33], [37], [40], [43], [45], [48], [50], [52], [54], [56], [58], [60], [62], [63], [66], [69], [73], [77], [81], [83], [86], [89], [91], [92], [93], [94], [95], [96]] not find
08190.json line idx:[[12]] not find


 68%|██████▊   | 8225/12104 [03:21<02:10, 29.62it/s]

08227.json line idx:[[0], [1], [2], [12], [53], [54], [55], [56], [57], [78]] not find


 68%|██████▊   | 8243/12104 [03:22<02:27, 26.12it/s]

08240.json line idx:[[30], [31], [32], [33], [34], [35], [36]] not find


 68%|██████▊   | 8253/12104 [03:23<02:21, 27.29it/s]

08245.json line idx:[[114]] not find
08246.json line idx:[[60]] not find
08248.json line idx:[[8], [9], [10], [11]] not find
08253.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40]] not find


 68%|██████▊   | 8270/12104 [03:23<01:39, 38.38it/s]

08263.json line idx:[[0], [1], [2], [3], [6], [8], [9], [10], [11], [13], [14], [15], [16], [17], [19], [20], [23], [24], [25], [26], [27], [28], [29], [31], [32], [33], [34], [35], [37], [38], [39], [40], [41], [43], [44], [45], [46], [48], [49], [50], [51], [53], [54], [55], [56], [57], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80]] not find


 68%|██████▊   | 8286/12104 [03:24<01:24, 45.38it/s]

08277.json line idx:[[16]] not find


 69%|██████▊   | 8314/12104 [03:24<01:30, 41.93it/s]

08315.json line idx:[[35]] not find


 69%|██████▉   | 8333/12104 [03:25<02:41, 23.36it/s]

08328.json line idx:[[15], [16], [17]] not find
08329.json line idx:[[29]] not find
08332.json line idx:[[0], [1], [2], [3], [5], [6], [7], [8], [9], [11], [12], [13], [14], [15], [17], [18], [19], [20], [21], [22], [23], [24], [25], [28], [29], [30], [31], [32], [33], [34], [35], [36], [39], [40], [41], [42], [43], [44], [45], [46], [47], [50], [51], [52], [53], [54], [55], [56], [57], [58], [61], [62], [63], [64], [65], [66], [67], [68], [69], [72], [73], [74], [75], [76], [77], [78], [79], [80], [83], [84], [85], [86], [87], [88], [89], [90], [91], [94], [95], [96], [97], [98], [99], [100], [101], [102], [105], [106], [107], [108], [109], [110], [111], [112], [113], [116], [117], [118], [119], [120], [121], [122], [123], [124], [127], [128], [129], [130], [131], [132], [133], [134], [135], [138], [139], [140], [141], [142], [143], [144], [145], [146], [149], [150], [151], [152], [153], [154], [155], [156], [157], [160], [161], [162], [163], [164], [165], [166], [167], [169], [171], 

 69%|██████▉   | 8356/12104 [03:26<02:04, 30.16it/s]

08350.json line idx:[[0], [4], [5], [8], [11], [13], [16], [17], [23], [24], [29], [31], [34], [37], [38], [39], [43], [44], [45], [50], [51], [57], [58], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76]] not find
08356.json line idx:[[0], [2], [3], [10], [26], [31], [36], [46], [55], [62], [65], [74], [76], [78], [80], [81], [82], [83], [84]] not find
08357.json line idx:[[10], [12], [13], [14], [15], [16], [17], [18], [19], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59]] not find


 69%|██████▉   | 8378/12104 [03:27<02:12, 28.10it/s]

08367.json line idx:[[0], [8], [17]] not find


 70%|██████▉   | 8437/12104 [03:29<02:03, 29.63it/s]

08428.json line idx:[[35]] not find


 70%|██████▉   | 8448/12104 [03:30<01:39, 36.81it/s]

08439.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [20], [21], [23], [24], [26], [27], [29], [31], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90], [91]] not find
08442.json line idx:[[64], [65], [66], [67], [68]] not find


 70%|███████   | 8489/12104 [03:31<01:26, 41.65it/s]

08481.json line idx:[[28], [29], [38], [39], [72], [73]] not find


 70%|███████   | 8505/12104 [03:31<01:19, 45.45it/s]

08502.json line idx:[[2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14]] not find


 70%|███████   | 8517/12104 [03:32<01:29, 39.89it/s]

08513.json line idx:[[12], [15], [21], [24], [31], [34]] not find


 71%|███████   | 8575/12104 [03:34<01:48, 32.61it/s]

08567.json line idx:[[62]] not find


 71%|███████   | 8597/12104 [03:35<01:12, 48.36it/s]

08586.json line idx:[[3]] not find


 71%|███████   | 8603/12104 [03:35<01:57, 29.92it/s]

08600.json line idx:[[0], [1], [2], [3], [4], [5], [6], [39], [40], [41], [42], [43], [44], [45]] not find


 71%|███████   | 8617/12104 [03:36<01:45, 33.19it/s]

08609.json line idx:[[6]] not find


 71%|███████▏  | 8631/12104 [03:36<01:48, 32.02it/s]

08625.json line idx:[[80]] not find
08630.json line idx:[[80]] not find


 71%|███████▏  | 8647/12104 [03:37<02:04, 27.66it/s]

08644.json line idx:[[0], [3], [4], [19], [20], [23], [24], [25], [26], [27], [28], [29]] not find


 72%|███████▏  | 8660/12104 [03:37<02:42, 21.13it/s]

08656.json line idx:[[105]] not find


 72%|███████▏  | 8698/12104 [03:39<01:24, 40.35it/s]

08686.json line idx:[[44]] not find


 72%|███████▏  | 8721/12104 [03:39<01:17, 43.76it/s]

08711.json line idx:[[11]] not find
08722.json line idx:[[9], [18], [21]] not find


 72%|███████▏  | 8756/12104 [03:40<01:32, 36.33it/s]

08748.json line idx:[[0]] not find
08754.json line idx:[[8], [9], [10], [11], [12], [13], [16], [17], [18], [19], [20], [21], [24], [27], [30], [32], [34], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [62], [64], [65], [67], [68], [70], [71], [74], [75], [76], [77], [78], [79], [81], [82], [83], [84], [86], [87], [88], [89], [90], [124], [125], [126], [127], [132], [133], [134], [135], [140], [141], [142], [143], [148], [151], [152], [153], [154], [167], [170], [171], [172], [173], [174], [175], [176], [181], [182], [183], [184], [185], [186], [187], [188], [189], [194], [195], [196], [197], [198], [199], [204], [205], [206], [207], [208], [209]] not find


 72%|███████▏  | 8769/12104 [03:41<02:02, 27.20it/s]

08764.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95], [96], [97], [98], [99], [100], [101]] not find
08771.json line idx:[[34], [35]] not find


 73%|███████▎  | 8785/12104 [03:42<02:07, 25.94it/s]

08781.json line idx:[[0], [31]] not find


 73%|███████▎  | 8849/12104 [03:44<02:03, 26.37it/s]

08843.json line idx:[[2]] not find


 73%|███████▎  | 8870/12104 [03:45<01:49, 29.56it/s]

08865.json line idx:[[3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [119], [120], [121], [122], [123], [124], [125], [126], [127], [128], [129], [130], [131], [132], [133], [134], [135], [136], [137], [138], [139], [140], [141], [142], [167]] not find


 74%|███████▎  | 8925/12104 [03:47<01:53, 27.92it/s]

08920.json line idx:[[209]] not find
08923.json line idx:[[38], [39], [40]] not find


 74%|███████▍  | 8934/12104 [03:47<01:51, 28.55it/s]

08928.json line idx:[[7], [8], [9]] not find


 74%|███████▍  | 8942/12104 [03:47<01:40, 31.35it/s]

08936.json line idx:[[0], [15], [16], [31], [32], [47], [48], [49], [77], [78]] not find


 74%|███████▍  | 8999/12104 [03:50<02:11, 23.53it/s]

08995.json line idx:[[1]] not find
08997.json line idx:[[1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47]] not find
09006.json line idx:[[41]] not find


 74%|███████▍  | 9017/12104 [03:50<01:10, 43.52it/s]

09015.json line idx:[[94]] not find


 75%|███████▍  | 9033/12104 [03:51<01:58, 25.98it/s]

09026.json line idx:[[16], [17], [18], [19]] not find
09027.json line idx:[[29]] not find


 75%|███████▍  | 9042/12104 [03:51<01:39, 30.68it/s]

09036.json line idx:[[8], [9], [10], [64]] not find


 75%|███████▍  | 9053/12104 [03:51<01:28, 34.59it/s]

09046.json line idx:[[33], [34], [63], [64], [93], [94], [123]] not find


 75%|███████▌  | 9106/12104 [03:53<01:25, 35.21it/s]

09092.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14]] not find


 75%|███████▌  | 9117/12104 [03:54<01:24, 35.17it/s]

09111.json line idx:[[8]] not find
09114.json line idx:[[76]] not find


 75%|███████▌  | 9122/12104 [03:54<01:44, 28.58it/s]

09121.json line idx:[[18]] not find
09122.json line idx:[[66]] not find


 76%|███████▌  | 9150/12104 [03:55<01:33, 31.71it/s]

09145.json line idx:[[0], [1], [79], [80], [88], [89], [90]] not find
09150.json line idx:[[0]] not find


 76%|███████▌  | 9198/12104 [03:57<01:16, 38.13it/s]

09188.json line idx:[[10]] not find
09191.json line idx:[[49]] not find
09192.json line idx:[[31]] not find
09195.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [22], [27]] not find


 76%|███████▌  | 9203/12104 [03:57<01:21, 35.69it/s]

09201.json line idx:[[39]] not find


 76%|███████▋  | 9248/12104 [03:58<01:27, 32.54it/s]

09246.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87]] not find


 77%|███████▋  | 9347/12104 [04:01<01:03, 43.23it/s]

09344.json line idx:[[4], [5], [6], [7], [8], [9]] not find


 78%|███████▊  | 9385/12104 [04:02<01:55, 23.56it/s]

09384.json line idx:[[41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76]] not find


 78%|███████▊  | 9393/12104 [04:03<01:52, 24.03it/s]

09387.json line idx:[[0], [88], [89]] not find
09389.json line idx:[[22], [25], [63], [64], [68], [108], [110]] not find
09390.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53]] not find
09394.json line idx:[[41], [42], [64]] not find
09398.json line idx:[[0], [1], [2]] not find


 78%|███████▊  | 9408/12104 [04:03<01:17, 34.76it/s]

09405.json line idx:[[0]] not find
09406.json line idx:[[0], [1], [114], [115]] not find


 78%|███████▊  | 9426/12104 [04:03<01:19, 33.52it/s]

09418.json line idx:[[0], [1], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [39], [40], [41], [42], [43], [44], [45], [46], [55]] not find


 78%|███████▊  | 9487/12104 [04:05<01:12, 36.09it/s]

09481.json line idx:[[1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32]] not find
09483.json line idx:[[79], [80], [81], [82], [83], [84]] not find


 79%|███████▊  | 9515/12104 [04:06<00:56, 45.90it/s]

09509.json line idx:[[22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35]] not find


 79%|███████▊  | 9531/12104 [04:06<01:11, 36.18it/s]

09525.json line idx:[[12]] not find


 79%|███████▉  | 9564/12104 [04:07<01:05, 39.02it/s]

09553.json line idx:[[15]] not find


 79%|███████▉  | 9585/12104 [04:08<01:25, 29.48it/s]

09583.json line idx:[[35]] not find


 80%|████████  | 9696/12104 [04:11<01:16, 31.31it/s]

09692.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48]] not find
09695.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10]] not find


 80%|████████  | 9706/12104 [04:11<01:04, 37.03it/s]

09702.json line idx:[[1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11]] not find


 80%|████████  | 9719/12104 [04:12<01:17, 30.76it/s]

09717.json line idx:[[147], [148]] not find


 80%|████████  | 9727/12104 [04:12<01:24, 28.21it/s]

09723.json line idx:[[21], [22], [23], [26], [27], [29], [31], [34], [35], [37], [39], [41], [43], [45], [48], [49], [51], [53], [56], [57], [84], [85], [86], [87], [89], [90], [91], [92], [95], [96], [97], [98], [101], [102], [103], [104], [107], [108], [109], [110], [113], [114], [115], [116], [119], [120], [121], [122], [125], [126], [127], [128], [131], [132], [133], [134], [136], [137], [139], [140]] not find
09726.json line idx:[[0], [1], [7], [8], [9], [10], [11], [12], [16], [17], [18], [19], [24], [25], [26], [27], [32], [33], [34], [35], [40], [41], [42], [43], [50], [51], [52], [53], [54], [55], [60], [61], [62], [63], [67], [68], [69], [70], [74], [78], [81], [84], [87], [90], [93], [96], [99], [102], [105], [108], [112], [113], [116], [119], [125], [130], [131]] not find


 81%|████████  | 9745/12104 [04:13<01:22, 28.48it/s]

09751.json line idx:[[36], [51]] not find


 81%|████████  | 9787/12104 [04:13<00:41, 55.56it/s]

09781.json line idx:[[39]] not find


 81%|████████  | 9833/12104 [04:15<01:16, 29.75it/s]

09829.json line idx:[[56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69]] not find
09830.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [23], [24], [25], [26], [27], [28], [29], [30], [31], [33], [34], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [68], [69], [70], [71], [72]] not find
09832.json line idx:[[15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32]] not find


 81%|████████▏ | 9840/12104 [04:16<01:39, 22.84it/s]

09836.json line idx:[[29], [30], [31], [65]] not find
09843.json line idx:[[22], [23]] not find


 81%|████████▏ | 9859/12104 [04:16<01:17, 28.92it/s]

09853.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70]] not find


 82%|████████▏ | 9867/12104 [04:17<01:24, 26.40it/s]

09866.json layout error: cell_idx: 2, row_span: [0, 3], col_span: [2, 4]
09868.json layout error: cell_idx: 4, row_span: [0, 2], col_span: [11, 17]


 82%|████████▏ | 9919/12104 [04:18<00:34, 62.44it/s]

09915.json line idx:[[23], [26], [29], [32], [35], [38], [39], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [57], [58], [61], [64], [66], [68], [70]] not find
09921.json line idx:[[3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [164], [165], [166]] not find


 82%|████████▏ | 9927/12104 [04:18<00:38, 56.04it/s]

09922.json line idx:[[51], [88]] not find


 82%|████████▏ | 9940/12104 [04:19<00:42, 50.97it/s]

09934.json line idx:[[24], [27]] not find


 82%|████████▏ | 9969/12104 [04:20<01:08, 31.27it/s]

09966.json line idx:[[4]] not find


 83%|████████▎ | 9988/12104 [04:20<01:12, 29.32it/s]

09979.json line idx:[[0], [1]] not find


 83%|████████▎ | 10014/12104 [04:22<04:12,  8.29it/s]

10013.json line idx:[[0]] not find


 83%|████████▎ | 10024/12104 [04:23<02:42, 12.82it/s]

10016.json line idx:[[71]] not find
10026.json line idx:[[34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95], [96], [97], [98], [99], [100], [101], [102], [103], [104], [105], [106], [107], [108], [109], [110], [111], [112], [113], [114], [115], [116], [117], [118], [119], [120], [121], [122], [123], [124], [125], [126], [127], [128], [129], [130], [131], [132], [133], [134], [135], [136], [137], [138], [139], [140], [141], [142], [143], [144], [145], [146], [147], [148], [149], [150], [151], [152], [153], [154], [155], [156], [157], [158], [159], [160], [161], [162], [163], [164], [165], [166], [167], [168], [169], [170], [171], [172], [173], [174], [175], [176], [186], [

 83%|████████▎ | 10070/12104 [04:25<01:02, 32.74it/s]

10063.json line idx:[[62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72]] not find
10069.json line idx:[[5]] not find


 84%|████████▎ | 10126/12104 [04:26<00:57, 34.38it/s]

10120.json line idx:[[0]] not find


 84%|████████▍ | 10143/12104 [04:27<01:07, 29.03it/s]

10138.json line idx:[[9], [13], [17], [38], [42], [46], [47], [51]] not find
10145.json line idx:[[8]] not find


 84%|████████▍ | 10162/12104 [04:28<01:17, 25.12it/s]

10157.json line idx:[[0], [1], [2], [3], [4], [5], [6]] not find


 84%|████████▍ | 10172/12104 [04:28<01:01, 31.17it/s]

10164.json line idx:[[27]] not find


 84%|████████▍ | 10212/12104 [04:29<00:35, 52.93it/s]

10209.json line idx:[[45], [46], [47], [48]] not find
10213.json line idx:[[20]] not find


 84%|████████▍ | 10220/12104 [04:29<00:41, 45.37it/s]

10220.json line idx:[[15], [16], [17], [18], [19], [20]] not find


 85%|████████▍ | 10239/12104 [04:30<00:56, 33.28it/s]

10228.json line idx:[[15], [16], [17], [18], [22]] not find
10229.json line idx:[[18], [24]] not find


 85%|████████▍ | 10271/12104 [04:31<01:03, 28.66it/s]

10266.json line idx:[[6], [7], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90]] not find
10267.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95], [96], [97], [98], [99], [100], [101]] not find
10270.js

 85%|████████▍ | 10284/12104 [04:32<00:59, 30.58it/s]

10277.json line idx:[[0], [1]] not find
10280.json line idx:[[69]] not find


 85%|████████▌ | 10305/12104 [04:33<01:07, 26.48it/s]

10300.json layout error: cell_idx: 0, row_span: [0, 2], col_span: [0, 8]


 85%|████████▌ | 10318/12104 [04:33<01:17, 22.93it/s]

10318.json line idx:[[6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87]] not find


 86%|████████▌ | 10350/12104 [04:35<00:56, 31.11it/s]

10329.json line idx:[[363]] not find
10351.json line idx:[[1], [2], [3], [4], [5], [6], [7], [15], [22]] not find


 86%|████████▌ | 10368/12104 [04:35<00:43, 39.72it/s]

10370.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22]] not find


 86%|████████▌ | 10428/12104 [04:37<00:44, 37.33it/s]

10425.json line idx:[[15], [16], [17], [20], [22], [23], [24], [36], [37], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65]] not find
10428.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10]] not find


 86%|████████▋ | 10449/12104 [04:38<01:03, 25.93it/s]

10444.json line idx:[[0], [1], [2], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [38], [39], [40], [41], [42], [44], [45], [46], [47], [48], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59]] not find


 87%|████████▋ | 10483/12104 [04:39<00:33, 47.86it/s]

10463.json line idx:[[24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88]] not find


 87%|████████▋ | 10501/12104 [04:39<00:21, 76.04it/s]

10501.json line idx:[[0], [1], [2], [3], [4], [5], [7]] not find


 87%|████████▋ | 10539/12104 [04:41<00:44, 35.50it/s]

10538.json line idx:[[42]] not find


 87%|████████▋ | 10557/12104 [04:41<00:59, 26.08it/s]

10554.json line idx:[[0]] not find
10555.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90], [91], [92]] not find
10562.json line idx:[[0], [1], [3], [4], [5], [6], [7], [8], [24], [25], [26], [27], [28], [29], [30], [31], [64], [65], [66], [67], [100], [101], [102], [103], [104], [105], [106], [107], [108], [125], [126]] not find


 87%|████████▋ | 10571/12104 [04:42<00:38, 39.36it/s]

10566.json line idx:[[0], [1], [2], [3], [4], [5], [6]] not find


 88%|████████▊ | 10593/12104 [04:43<01:09, 21.89it/s]

10591.json line idx:[[189]] not find


 88%|████████▊ | 10606/12104 [04:43<00:54, 27.68it/s]

10603.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12]] not find


 88%|████████▊ | 10650/12104 [04:43<00:15, 93.63it/s]

10614.json line idx:[[49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59]] not find
10619.json line idx:[[7], [8]] not find


 88%|████████▊ | 10662/12104 [04:44<00:17, 80.84it/s]

10651.json line idx:[[0], [4], [9], [15], [17], [23], [27], [31]] not find
10653.json line idx:[[29], [45]] not find


 88%|████████▊ | 10672/12104 [04:44<00:19, 71.66it/s]

10663.json line idx:[[0], [1], [2], [3], [4], [75], [76]] not find
10664.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25]] not find
10668.json line idx:[[13], [14]] not find


 88%|████████▊ | 10707/12104 [04:45<00:39, 35.73it/s]

10702.json line idx:[[0], [11], [47], [48]] not find


 89%|████████▊ | 10724/12104 [04:45<00:32, 42.93it/s]

10719.json line idx:[[13], [14], [41], [42], [43], [83], [84], [85], [86], [87]] not find
10723.json line idx:[[28], [29], [30], [31]] not find
10725.json line idx:[[7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19]] not find


 89%|████████▊ | 10739/12104 [04:46<00:40, 33.64it/s]

10741.json line idx:[[13], [15], [17], [20], [21], [23], [25], [27], [29], [31], [33], [35], [37], [39], [41], [43], [44], [46], [48], [51], [52], [55], [58], [59], [60], [62], [64], [66], [68], [70], [72], [74], [76]] not find


 89%|████████▉ | 10801/12104 [04:48<00:33, 39.20it/s]

10801.json line idx:[[20]] not find


 89%|████████▉ | 10827/12104 [04:48<00:28, 44.55it/s]

10816.json line idx:[[54]] not find


 90%|████████▉ | 10842/12104 [04:49<00:42, 29.52it/s]

10838.json line idx:[[0]] not find
10841.json line idx:[[34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84]] not find


 90%|████████▉ | 10846/12104 [04:49<00:50, 24.73it/s]

10845.json line idx:[[23], [24], [33], [34], [35], [45], [51], [58], [66], [73], [79], [80], [90], [91], [98], [99], [106], [107], [114], [133]] not find


 90%|████████▉ | 10865/12104 [04:50<00:49, 24.79it/s]

10853.json line idx:[[0], [1], [39], [40], [41], [42], [43]] not find
10857.json line idx:[[0], [1], [2], [3], [4]] not find
10861.json line idx:[[30], [32], [33], [34], [37], [38], [45], [46], [47]] not find


 90%|████████▉ | 10888/12104 [04:51<00:53, 22.53it/s]

10883.json line idx:[[56]] not find


 90%|█████████ | 10904/12104 [04:52<00:47, 25.43it/s]

10898.json line idx:[[75], [76]] not find


 90%|█████████ | 10947/12104 [04:53<00:30, 38.18it/s]

10940.json line idx:[[2], [3], [4], [5], [18], [19], [75], [76], [77], [82]] not find


 90%|█████████ | 10953/12104 [04:53<00:29, 39.25it/s]

10950.json line idx:[[0]] not find


 91%|█████████ | 10999/12104 [04:56<00:42, 25.89it/s]

10992.json line idx:[[49], [52], [53], [55], [56], [59], [60], [63], [108], [109], [110], [111]] not find


 91%|█████████ | 11010/12104 [04:56<00:30, 35.62it/s]

11001.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [27], [28], [30], [31], [33], [35], [37], [39], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89]] not find
11008.json line idx:[[0]] not find


 91%|█████████ | 11021/12104 [04:56<00:27, 38.78it/s]

11016.json line idx:[[3]] not find
11020.json line idx:[[52]] not find


 91%|█████████ | 11030/12104 [04:56<00:34, 30.77it/s]

11026.json line idx:[[0], [1]] not find


 91%|█████████▏| 11049/12104 [04:57<00:29, 35.24it/s]

11040.json line idx:[[10]] not find
11043.json line idx:[[24], [25], [81], [82]] not find


 92%|█████████▏| 11077/12104 [04:57<00:12, 81.39it/s]

11077.json line idx:[[0], [9], [21], [36], [37], [62], [63]] not find


 92%|█████████▏| 11093/12104 [04:58<00:27, 36.21it/s]

11096.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [62], [63], [66], [67], [68], [70], [71], [72], [73], [74], [75], [76]] not find


 92%|█████████▏| 11114/12104 [04:59<00:29, 33.33it/s]

11109.json line idx:[[51]] not find


 92%|█████████▏| 11153/12104 [05:00<00:42, 22.22it/s]

11148.json line idx:[[25], [51]] not find


 92%|█████████▏| 11172/12104 [05:01<00:30, 30.26it/s]

11166.json line idx:[[0], [1], [38], [39], [40]] not find


 92%|█████████▏| 11184/12104 [05:01<00:31, 28.79it/s]

11177.json line idx:[[10], [11], [38], [39], [44], [45], [56], [57], [82], [83], [108], [109], [120], [121], [143], [144]] not find
11180.json line idx:[[17]] not find


 92%|█████████▏| 11188/12104 [05:02<00:44, 20.43it/s]

11186.json line idx:[[65], [66], [92], [93], [117], [118]] not find


 93%|█████████▎| 11202/12104 [05:02<00:34, 26.16it/s]

11198.json line idx:[[3], [4], [7], [8], [11], [12], [13], [14], [15], [18], [19], [20], [21], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95], [96], [97], [98], [99], [100], [101], [102], [103], [104], [105], [106], [107], [108], [109], [110], [111], [112], [113], [114], [115], [116], [117], [118], [119], [120], [121], [122], [123], [124], [125], [126], [127], [128], [129], [130], [134], [135], [136], [137], [138], [139], [140], [141], [142], [143], [144], [145], [146], [147], [148], [149]] not find
11200.json line idx:[[1], [2], [3], [4], [5], [6], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], 

 93%|█████████▎| 11257/12104 [05:03<00:19, 43.16it/s]

11261.json line idx:[[166], [167]] not find


 93%|█████████▎| 11269/12104 [05:05<00:48, 17.28it/s]

11263.json line idx:[[11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51]] not find


 93%|█████████▎| 11297/12104 [05:06<00:30, 26.16it/s]

11295.json line idx:[[17], [18], [19], [20]] not find


 93%|█████████▎| 11302/12104 [05:06<00:46, 17.18it/s]

11299.json line idx:[[0]] not find


 93%|█████████▎| 11311/12104 [05:06<00:34, 22.83it/s]

11305.json line idx:[[5]] not find


 94%|█████████▎| 11328/12104 [05:07<00:34, 22.59it/s]

11327.json line idx:[[12], [13]] not find


 94%|█████████▍| 11357/12104 [05:08<00:16, 46.33it/s]

11339.json line idx:[[10], [11], [12], [13], [16], [17], [18], [20], [21], [22], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34]] not find


 94%|█████████▍| 11373/12104 [05:08<00:13, 54.56it/s]

11363.json line idx:[[38], [58]] not find
11364.json line idx:[[19], [20]] not find


 94%|█████████▍| 11409/12104 [05:09<00:17, 39.77it/s]

11400.json line idx:[[58]] not find


 94%|█████████▍| 11414/12104 [05:10<00:24, 28.46it/s]

11416.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95], [96], [97], [98], [99], [100], [101], [102], [103], [104], [105], [106], [107], [108], [109], [110], [111], [112], [113], [114], [115], [116], [117], [118], [119], [120], [121], [122], [123], [124], [125], [126], [127], [128], [129], [130], [131], [132], [133], [134], [135], [136], [137], [138], [139], [140], [141], [142], [143], [144], [145], [146], [147], [148], [149], [150], [151], [152], [153], [154]] not find


 94%|█████████▍| 11424/12104 [05:10<00:34, 19.67it/s]

11420.json line idx:[[2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [85], [86], [87], [88], [89], [90], [91], [92], [93], [94], [95], [96], [97], [98], [99], [100], [101], [102], [103], [104]] not find


 94%|█████████▍| 11436/12104 [05:11<00:21, 31.01it/s]

11428.json line idx:[[2], [10], [15], [24]] not find
11432.json line idx:[[0], [1], [2], [68], [69]] not find


 95%|█████████▍| 11443/12104 [05:11<00:17, 37.98it/s]

11443.json line idx:[[1], [2], [3], [4], [5]] not find


 95%|█████████▍| 11460/12104 [05:11<00:19, 33.58it/s]

11454.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67]] not find


 95%|█████████▌| 11506/12104 [05:12<00:08, 73.69it/s]

11510.json line idx:[[0], [1], [3], [4]] not find


 95%|█████████▌| 11522/12104 [05:13<00:17, 33.47it/s]

11512.json line idx:[[263], [429]] not find


 95%|█████████▌| 11543/12104 [05:14<00:15, 35.85it/s]

11532.json line idx:[[30]] not find


 96%|█████████▌| 11560/12104 [05:14<00:14, 38.57it/s]

11553.json line idx:[[15], [16], [17]] not find


 96%|█████████▌| 11569/12104 [05:15<00:18, 28.56it/s]

11566.json line idx:[[0], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84]] not find


 96%|█████████▌| 11573/12104 [05:15<00:21, 24.87it/s]

11572.json line idx:[[44], [60], [61], [62], [64], [65], [66], [69], [70], [71], [72], [73], [130], [131], [132], [133], [134], [135]] not find


 96%|█████████▌| 11592/12104 [05:16<00:21, 23.36it/s]

11588.json line idx:[[191], [192], [193]] not find


 96%|█████████▌| 11604/12104 [05:16<00:18, 27.29it/s]

11598.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [80], [81], [82], [83], [84], [85], [104], [105], [106], [107], [108], [109], [110], [111], [112], [113], [114], [115], [116], [117], [118], [119], [120], [121], [122], [123], [124], [146]] not find


 96%|█████████▌| 11608/12104 [05:16<00:18, 26.13it/s]

11606.json line idx:[[0]] not find
11608.json line idx:[[86], [87], [88], [89]] not find


 96%|█████████▋| 11659/12104 [05:18<00:12, 36.05it/s]

11653.json line idx:[[0], [2], [5], [7], [9], [10], [11], [41], [42]] not find


 97%|█████████▋| 11713/12104 [05:20<00:13, 28.47it/s]

11709.json line idx:[[5], [7], [8], [9], [10], [11], [12], [13]] not find
11712.json line idx:[[36], [37], [38], [39], [40], [41], [42]] not find


 97%|█████████▋| 11724/12104 [05:20<00:12, 30.69it/s]

11720.json line idx:[[25], [26], [52], [53]] not find
11721.json layout error: cell_idx: 0, row_span: [0, 2], col_span: [0, 10]


 97%|█████████▋| 11739/12104 [05:20<00:08, 44.42it/s]

11735.json line idx:[[0], [1], [2], [3], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51]] not find


 97%|█████████▋| 11749/12104 [05:21<00:11, 32.08it/s]

11745.json line idx:[[20], [21], [22], [23], [52], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [88], [89], [90], [91], [92], [93], [94], [95], [96], [97], [98], [99], [100], [101], [102], [103], [104], [105], [106], [107], [108], [109], [110], [111], [112], [113], [114], [115], [116], [117], [118], [119], [120], [121], [122], [123], [124], [125], [126], [127], [128], [129], [130], [131], [132], [133], [134], [135], [136], [137], [138], [139], [140], [141], [142], [143], [144], [145], [146]] not find


 97%|█████████▋| 11760/12104 [05:21<00:11, 28.67it/s]

11758.json line idx:[[0], [1], [32], [33], [67], [68], [69]] not find


 97%|█████████▋| 11780/12104 [05:22<00:08, 37.64it/s]

11774.json line idx:[[38], [39], [40], [41], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [64], [65], [66], [67], [68], [69], [70], [71], [72], [73], [74], [75], [76], [77], [78], [79], [80], [81], [82], [83], [84], [89], [90], [91], [92], [94], [95], [96], [139], [140], [141], [142], [143], [144], [145], [146], [147], [150], [151], [152], [153], [154], [155], [156], [157], [158], [159], [162], [163], [164], [165], [166], [167], [168], [169], [171], [172]] not find


 98%|█████████▊| 11845/12104 [05:23<00:05, 48.61it/s]

11834.json line idx:[[2]] not find


 98%|█████████▊| 11889/12104 [05:24<00:07, 27.20it/s]

11882.json line idx:[[0]] not find


 99%|█████████▉| 11992/12104 [05:28<00:03, 33.46it/s]

11988.json line idx:[[25], [26]] not find
11992.json line idx:[[28], [79], [90]] not find


 99%|█████████▉| 12006/12104 [05:28<00:03, 27.61it/s]

12004.json line idx:[[57]] not find
12006.json line idx:[[275]] not find


 99%|█████████▉| 12013/12104 [05:29<00:03, 23.17it/s]

12009.json line idx:[[0], [1], [2], [3], [4], [5], [6], [8], [9], [10], [11], [12], [13], [14], [15]] not find


 99%|█████████▉| 12028/12104 [05:29<00:02, 37.18it/s]

12022.json line idx:[[90], [91], [92], [93], [94], [95], [96], [97], [98], [99], [100], [101], [102], [103], [104], [105], [106], [107], [108], [109], [110], [111], [112], [113], [114], [115], [116], [117], [118], [119], [120], [121], [122], [123], [124], [125], [126], [127], [128], [129], [130], [131], [132], [133], [134]] not find
12025.json line idx:[[0], [1], [2], [3], [4], [5], [6], [7], [8], [9], [10], [11], [12], [13], [14], [15], [16], [17], [18], [19], [20], [21], [22], [23], [24], [25], [26], [27], [28], [29], [30], [31], [32], [33], [34], [35], [36], [37], [38], [39], [40], [41], [42], [43], [44], [45], [46], [47], [48], [49], [50], [51], [52], [53], [54], [55], [56], [57], [58], [59], [60], [61], [62], [63], [64]] not find


 99%|█████████▉| 12037/12104 [05:30<00:02, 23.24it/s]

12035.json line idx:[[49]] not find


100%|█████████▉| 12074/12104 [05:31<00:00, 38.84it/s]

12058.json line idx:[[7], [8], [9], [10], [11]] not find


100%|██████████| 12104/12104 [05:32<00:00, 36.45it/s]

12077.json line idx:[[434]] not find
12094.json line idx:[[10]] not find
12099.json layout error: cell_idx: 3, row_span: [1, 6], col_span: [1, 3]
table error: 447



