lhallee committed on
Commit
5fa2ec2
·
verified ·
1 Parent(s): 469a1e6

Upload modeling_esm_plusplus.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. modeling_esm_plusplus.py +1 -2
modeling_esm_plusplus.py CHANGED
@@ -597,7 +597,7 @@ class ProteinDataset(TorchDataset):
597
  def build_collator(tokenizer) -> Callable[[list[str]], tuple[torch.Tensor, torch.Tensor]]:
598
  def _collate_fn(sequences: list[str]) -> tuple[torch.Tensor, torch.Tensor]:
599
  """Collate function for batching sequences."""
600
- return tokenizer(sequences, return_tensors="pt", padding='longest', pad_to_multiple_of=8)
601
  return _collate_fn
602
 
603
 
@@ -755,7 +755,6 @@ class EmbeddingMixin:
755
 
756
  return embeddings_dict
757
 
758
-
759
  class PreTrainedESMplusplusModel(PreTrainedModel):
760
  """
761
  init weights for ESM++ models
 
597
  def build_collator(tokenizer) -> Callable[[list[str]], tuple[torch.Tensor, torch.Tensor]]:
598
  def _collate_fn(sequences: list[str]) -> tuple[torch.Tensor, torch.Tensor]:
599
  """Collate function for batching sequences."""
600
+ return tokenizer(sequences, return_tensors="pt", padding='longest')
601
  return _collate_fn
602
 
603
 
 
755
 
756
  return embeddings_dict
757
 
 
758
  class PreTrainedESMplusplusModel(PreTrainedModel):
759
  """
760
  init weights for ESM++ models