davanstrien HF Staff committed on
Commit
d1489e3
·
1 Parent(s): d7ac8e4

remove flashinfer

Browse files
Files changed (1) hide show
  1. generate_summaries_uv.py +1 -2
generate_summaries_uv.py CHANGED
@@ -2,7 +2,6 @@
2
  # requires-python = ">=3.10"
3
  # dependencies = [
4
  # "datasets",
5
- # "flashinfer-python",
6
  # "hf_transfer",
7
  # "huggingface-hub[hf_xet]",
8
  # "polars",
@@ -21,7 +20,7 @@ from typing import Optional
21
 
22
  # Set environment variables to speed up model loading
23
  os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"
24
- os.environ["VLLM_ATTENTION_BACKEND"] = "FLASHINFER"
25
 
26
  import polars as pl
27
  from datasets import Dataset, load_dataset
 
2
  # requires-python = ">=3.10"
3
  # dependencies = [
4
  # "datasets",
 
5
  # "hf_transfer",
6
  # "huggingface-hub[hf_xet]",
7
  # "polars",
 
20
 
21
  # Set environment variables to speed up model loading
22
  os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"
23
+ # Note: VLLM will auto-select the best available attention backend
24
 
25
  import polars as pl
26
  from datasets import Dataset, load_dataset