Spaces:
AIR-Bench
/
Running on CPU Upgrade

hanhainebula committed on
Commit
ca2a141
1 Parent(s): d27648d

Modify the commands of evaluating

Browse files
Files changed (1) hide show
  1. src/about.py +91 -84
src/about.py CHANGED
@@ -30,109 +30,116 @@ pip install .
30
  ```bash
31
  cd AIR-Bench/scripts
32
  # Run all tasks
33
- python run_AIR-Bench.py \
34
- --output_dir ./search_results \
35
  --encoder BAAI/bge-m3 \
36
- --encoder_link https://huggingface.co/BAAI/bge-m3 \
37
- --reranker BAAI/bge-reranker-v2-m3 \
38
- --reranker_link https://huggingface.co/BAAI/bge-reranker-v2-m3 \
39
- --search_top_k 1000 \
40
- --rerank_top_k 100 \
41
- --max_query_length 512 \
42
- --max_passage_length 512 \
43
- --batch_size 512 \
44
- --pooling_method cls \
45
- --normalize_embeddings True \
46
- --use_fp16 True \
47
- --add_instruction False \
48
  --overwrite False
49
 
50
  # Run the tasks in the specified task type
51
- python run_AIR-Bench.py \
52
- --task_types long-doc \
53
- --output_dir ./search_results \
54
- --encoder BAAI/bge-m3 \
55
- --encoder_link https://huggingface.co/BAAI/bge-m3 \
56
- --reranker BAAI/bge-reranker-v2-m3 \
57
- --reranker_link https://huggingface.co/BAAI/bge-reranker-v2-m3 \
58
- --search_top_k 1000 \
59
- --rerank_top_k 100 \
60
- --max_query_length 512 \
61
- --max_passage_length 512 \
62
- --batch_size 512 \
63
- --pooling_method cls \
64
- --normalize_embeddings True \
65
- --use_fp16 True \
66
- --add_instruction False \
67
  --overwrite False
68
 
69
  # Run the tasks in the specified task type and domains
70
- python run_AIR-Bench.py \
71
- --task_types long-doc \
72
- --domains arxiv book \
73
- --output_dir ./search_results \
74
- --encoder BAAI/bge-m3 \
75
- --encoder_link https://huggingface.co/BAAI/bge-m3 \
76
- --reranker BAAI/bge-reranker-v2-m3 \
77
- --reranker_link https://huggingface.co/BAAI/bge-reranker-v2-m3 \
78
- --search_top_k 1000 \
79
- --rerank_top_k 100 \
80
- --max_query_length 512 \
81
- --max_passage_length 512 \
82
- --batch_size 512 \
83
- --pooling_method cls \
84
- --normalize_embeddings True \
85
- --use_fp16 True \
86
- --add_instruction False \
87
  --overwrite False
88
 
89
  # Run the tasks in the specified languages
90
- python run_AIR-Bench.py \
91
- --languages en \
92
- --output_dir ./search_results \
93
- --encoder BAAI/bge-m3 \
94
- --encoder_link https://huggingface.co/BAAI/bge-m3 \
95
- --reranker BAAI/bge-reranker-v2-m3 \
96
- --reranker_link https://huggingface.co/BAAI/bge-reranker-v2-m3 \
97
- --search_top_k 1000 \
98
- --rerank_top_k 100 \
99
- --max_query_length 512 \
100
- --max_passage_length 512 \
101
- --batch_size 512 \
102
- --pooling_method cls \
103
- --normalize_embeddings True \
104
- --use_fp16 True \
105
- --add_instruction False \
106
  --overwrite False
107
 
108
  # Run the tasks in the specified task type, domains, and languages
109
- python run_AIR-Bench.py \
110
- --task_types qa \
111
- --domains wiki web \
112
- --languages en \
113
- --output_dir ./search_results \
114
- --encoder BAAI/bge-m3 \
115
- --encoder_link https://huggingface.co/BAAI/bge-m3 \
116
- --reranker BAAI/bge-reranker-v2-m3 \
117
- --reranker_link https://huggingface.co/BAAI/bge-reranker-v2-m3 \
118
- --search_top_k 1000 \
119
- --rerank_top_k 100 \
120
- --max_query_length 512 \
121
- --max_passage_length 512 \
122
- --batch_size 512 \
123
- --pooling_method cls \
124
- --normalize_embeddings True \
125
- --use_fp16 True \
126
- --add_instruction False \
127
  --overwrite False
128
  ```
129
  3. Package the search results.
130
  ```bash
 
131
  python zip_results.py \
132
- --results_path search_results/bge-m3 \
133
- --save_path search_results/zipped_results
 
 
 
 
 
 
 
 
134
  ```
135
- 4. Upload the `.zip` file on this page and fill in the model information.
 
 
 
 
 
 
136
  5. Congratulations! Your results will be shown on the leaderboard in up to one hour.
137
  """
138
 
 
30
  ```bash
31
  cd AIR-Bench/scripts
32
  # Run all tasks
33
+ python run_AIR-Bench.py \\
34
+ --output_dir ./search_results \\
35
  --encoder BAAI/bge-m3 \
36
+ --reranker BAAI/bge-reranker-v2-m3 \\
37
+ --search_top_k 1000 \\
38
+ --rerank_top_k 100 \\
39
+ --max_query_length 512 \\
40
+ --max_passage_length 512 \\
41
+ --batch_size 512 \\
42
+ --pooling_method cls \\
43
+ --normalize_embeddings True \\
44
+ --use_fp16 True \\
45
+ --add_instruction False \\
 
 
46
  --overwrite False
47
 
48
  # Run the tasks in the specified task type
49
+ python run_AIR-Bench.py \\
50
+ --task_types long-doc \\
51
+ --output_dir ./search_results \\
52
+ --encoder BAAI/bge-m3 \\
53
+ --reranker BAAI/bge-reranker-v2-m3 \\
54
+ --search_top_k 1000 \\
55
+ --rerank_top_k 100 \\
56
+ --max_query_length 512 \\
57
+ --max_passage_length 512 \\
58
+ --batch_size 512 \\
59
+ --pooling_method cls \\
60
+ --normalize_embeddings True \\
61
+ --use_fp16 True \\
62
+ --add_instruction False \\
 
 
63
  --overwrite False
64
 
65
  # Run the tasks in the specified task type and domains
66
+ python run_AIR-Bench.py \\
67
+ --task_types long-doc \\
68
+ --domains arxiv book \\
69
+ --output_dir ./search_results \\
70
+ --encoder BAAI/bge-m3 \\
71
+ --reranker BAAI/bge-reranker-v2-m3 \\
72
+ --search_top_k 1000 \\
73
+ --rerank_top_k 100 \\
74
+ --max_query_length 512 \\
75
+ --max_passage_length 512 \\
76
+ --batch_size 512 \\
77
+ --pooling_method cls \\
78
+ --normalize_embeddings True \\
79
+ --use_fp16 True \\
80
+ --add_instruction False \\
 
 
81
  --overwrite False
82
 
83
  # Run the tasks in the specified languages
84
+ python run_AIR-Bench.py \\
85
+ --languages en \\
86
+ --output_dir ./search_results \\
87
+ --encoder BAAI/bge-m3 \\
88
+ --reranker BAAI/bge-reranker-v2-m3 \\
89
+ --search_top_k 1000 \\
90
+ --rerank_top_k 100 \\
91
+ --max_query_length 512 \\
92
+ --max_passage_length 512 \\
93
+ --batch_size 512 \\
94
+ --pooling_method cls \\
95
+ --normalize_embeddings True \\
96
+ --use_fp16 True \\
97
+ --add_instruction False \\
 
 
98
  --overwrite False
99
 
100
  # Run the tasks in the specified task type, domains, and languages
101
+ python run_AIR-Bench.py \\
102
+ --task_types qa \\
103
+ --domains wiki web \\
104
+ --languages en \\
105
+ --output_dir ./search_results \\
106
+ --encoder BAAI/bge-m3 \\
107
+ --encoder_link https://huggingface.co/BAAI/bge-m3 \\
108
+ --reranker BAAI/bge-reranker-v2-m3 \\
109
+ --reranker_link https://huggingface.co/BAAI/bge-reranker-v2-m3 \\
110
+ --search_top_k 1000 \\
111
+ --rerank_top_k 100 \\
112
+ --max_query_length 512 \\
113
+ --max_passage_length 512 \\
114
+ --batch_size 512 \\
115
+ --pooling_method cls \\
116
+ --normalize_embeddings True \\
117
+ --use_fp16 True \\
118
+ --add_instruction False \\
119
  --overwrite False
120
  ```
121
  3. Package the search results.
122
  ```bash
123
+ # Zip "Embedding Model + NoReranker" search results in "<search_results>/<model_name>/NoReranker" to "<save_dir>/<model_name>_NoReranker.zip".
124
  python zip_results.py \
125
+ --results_dir search_results \
126
+ --model_name bge-m3 \
127
+ --save_dir search_results/zipped_results
128
+
129
+ # Zip "Embedding Model + Reranker" search results in "<search_results>/<model_name>/<reranker_name>" to "<save_dir>/<model_name>_<reranker_name>.zip".
130
+ python zip_results.py \
131
+ --results_dir search_results \
132
+ --model_name bge-m3 \
133
+ --reranker_name bge-reranker-v2-m3 \
134
+ --save_dir search_results/zipped_results
135
  ```
136
+ 4. Upload the `.zip` file on this page and fill in the model information:
137
+ - Model Name: such as `bge-m3`.
138
+ - Model URL: such as `https://huggingface.co/BAAI/bge-m3`.
139
+ - Reranker Name: such as `bge-reranker-v2-m3`. Keep empty for `NoReranker`.
140
+ - Reranker URL: such as `https://huggingface.co/BAAI/bge-reranker-v2-m3`. Keep empty for `NoReranker`.
141
+
142
+ If you want to stay anonymous, you can fill in only the Model Name and Reranker Name (keep empty for `NoReranker`), and check the selection box below before submission.
143
  5. Congratulations! Your results will be shown on the leaderboard in up to one hour.
144
  """
145