File size: 1,414 Bytes
07d2942
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
# Runs the `batch2reg` task of batch.py once per numbered data directory,
# pausing between runs.
#
# Directories are numbered start_index..total_files with BOTH ends inclusive,
# so total_files is the index of the last directory, not a count.
#
# Exit status: 0 when every batch2reg run succeeded, 1 when at least one
# failed (failures are reported on stderr and the remaining directories are
# still processed).
#
# No shebang is visible in this file, so only POSIX sh constructs are used.
start_index=0
total_files=0
wait_time_in_seconds=10

# Number of directories whose batch2reg run returned a non-zero status.
failed_count=0

i=$start_index
while [ "$i" -le "$total_files" ]; do
    # Exactly one data_dir assignment should be active; the commented ones
    # are alternative inputs kept for manual switching.
    # data_dir="data"/"gpt-4o-mini"/"output_0402_1_篩選結果.xlsx - Sheet1_$i"
    # data_dir="data"/"gpt-4o-mini"/"output_0402_2_篩選結果.xlsx - Sheet1_$i"
    data_dir="data/gpt-4o-mini/output_0402_3_篩選結果.xlsx - Sheet1_${i}"
    # data_dir="data"/"gpt-4o-mini"/"output_0402_4_篩選結果.xlsx - Sheet1_$i"
    # data_dir="data/tmp"

    # The commented-out steps below are disabled pipeline stages; presumably
    # they produce the inputs consumed by batch2reg -- confirm before enabling.

    # echo "Preparing batch data ..."
    # python batch.py -t prepare_regularization \
    #     -erp "$data_dir"/extracted_results.joblib \
    #     -o "$data_dir"/regularization.jsonl \
    #     -topn 200

    # echo "Executing batch data ..."
    # python batch.py -t run_batch \
    #     -i "$data_dir"/regularization.jsonl \
    #     -j "$data_dir"/reg_job.joblib \
    #     -jp "$data_dir"/reg_output.jsonl

    # echo "Converting batch to extracted results ..."
    # python model.py -t batch2extract \
    #     -jp "$data_dir"/output.jsonl \
    #     -crp "$data_dir"/crawled_results.joblib \
    #     -erp "$data_dir"/extracted_results.joblib

    echo "Converting batch to regularized results ..."
    # Check the exit status so a failed run is not reported as success.
    if ! python batch.py -t batch2reg \
        -jp "$data_dir/reg_output.jsonl" \
        -erp "$data_dir/extracted_results.joblib" \
        -rrp "$data_dir/regularized_results.joblib"; then
        echo "Error: batch2reg failed for $data_dir" >&2
        failed_count=$((failed_count + 1))
    fi

    # Pause after every run, including the last one (unchanged behavior).
    # NOTE(review): the reason for the pause is not visible here -- confirm
    # whether the trailing sleep is actually needed.
    sleep "$wait_time_in_seconds"

    i=$((i + 1))
done

if [ "$failed_count" -gt 0 ]; then
    echo "Error: $failed_count task(s) failed." >&2
    exit 1
fi

echo "All tasks completed."