File size: 657 Bytes
5c36ec7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
#!/bin/bash
#
# Runs docgenie/data/cmds/prepare_synth_datasets.py once for every entry in
# the `datasets` list below.
#
# Usage: <this-script> [ARGS...]
#   ARGS are forwarded unchanged to every invocation of the Python script.
#
# The Python script is referenced by a relative path, so this must be run
# from the directory that contains `docgenie/`.
#
# Exit status: 0 if every invocation succeeded, 1 if at least one failed.
# A failure does not stop the remaining datasets from being processed.

# Each entry is a dataset name, optionally followed by whitespace-separated
# extra flags that apply to that dataset only.
declare -a datasets=(
    # classification
    "rvlcdip_alpha=1.0"
    "tobacco3482_alpha=1.0"
    "doclaynet4k_alpha=1.0_CLS"

    # docvqa
    "docvqa_alpha=1.0"
    "wtq_alpha=1.0"

    # kie
    "cord_alpha=1.0"
    "funsd_alpha=1.0"
    "kleister_alpha=1.0"
    "sroie_alpha=1.0"

    # layout analysis
    "publaynet_correct-sampling_alpha=1.0"
    "icdar2019_alpha=1.0"
    "doclaynet4k_alpha=1.0_DLA --clip-bboxes-to-foreground"
)

#######################################
# Run the preparation script for a single dataset entry.
# Arguments:
#   $1   - dataset entry: a name plus optional per-dataset flags, separated
#          by whitespace
#   $2.. - extra arguments appended verbatim to the command line
# Returns:
#   The exit status of the python invocation.
#######################################
prepare_dataset() {
    local spec=$1
    shift

    # Split the entry into words explicitly. `read -a` splits on whitespace
    # like an unquoted expansion would, but performs no pathname expansion.
    local -a spec_words=()
    read -r -a spec_words <<< "${spec}"

    python docgenie/data/cmds/prepare_synth_datasets.py \
        --dataset-name "${spec_words[@]}" "$@"
}

#######################################
# Prepare every dataset in `datasets`, forwarding all arguments.
# Globals:
#   datasets (read)
# Arguments:
#   Forwarded unchanged to each python invocation.
# Outputs:
#   One progress line per dataset on stdout; failures are reported on stderr.
# Returns:
#   0 if all datasets were prepared, 1 otherwise.
#######################################
main() {
    local dataset
    local status=0

    for dataset in "${datasets[@]}"; do
        echo "Preparing synthetic dataset: ${dataset}"
        # Keep going after a failure so one bad dataset does not block the
        # rest, but remember it so the overall exit status reflects it.
        if ! prepare_dataset "${dataset}" "$@"; then
            echo "Failed to prepare synthetic dataset: ${dataset}" >&2
            status=1
        fi
    done

    return "${status}"
}

# Last command of the script: its return value becomes the exit status.
main "$@"