Docgenie-API / scripts /data /prepare_alpha_sampling_datasets.sh
Ahadhassan-2003
deploy: update HF Space
5c36ec7
#!/bin/bash
# Names of the synthetic datasets to prepare.
# Each corpus is combined with three alpha values and two revisions: the names
# carrying the "_v1" suffix, and the unsuffixed names, which are the v2 revision.
declare -a datasets=()
for corpus in rvlcdip docvqa cord publaynet_correct-sampling; do
  # Within a corpus, all "_v1" names come first, followed by the v2 names.
  for revision in "_v1" ""; do
    for alpha in 0.5 0.75 1.0; do
      datasets+=("${corpus}_alpha=${alpha}${revision}")
    done
  done
done
# Drop the loop helpers so only `datasets` remains defined.
unset corpus revision alpha
# Run the synthetic-dataset preparation script once for every entry in
# `datasets`, forwarding this script's own command-line arguments to each run.
for dataset in "${datasets[@]}"; do
  echo "Preparing synthetic dataset: ${dataset}"
  # Both expansions are quoted: left unquoted, ${dataset} and $@ undergo word
  # splitting and pathname expansion, so a forwarded argument containing
  # whitespace or glob characters would arrive as different arguments.
  python docgenie/data/cmds/prepare_synth_datasets.py --dataset-name "${dataset}" "$@"
done