Vishwas1 committed on
Commit
3a4bc44
·
verified ·
1 Parent(s): 93a2c3f

Update train_model.py

Browse files
Files changed (1) hide show
  1. train_model.py +2 -1
train_model.py CHANGED
@@ -100,7 +100,8 @@ def initialize_model(task, model_name, vocab_size, sequence_length, hidden_size,
100
  num_attention_heads=attention_heads,
101
  intermediate_size=4 * hidden_size,
102
  hidden_act='gelu',
103
- use_cache=True
 
104
  )
105
  model = GPT2LMHeadModel(config)
106
  logging.info("GPT2LMHeadModel initialized successfully.")
 
100
  num_attention_heads=attention_heads,
101
  intermediate_size=4 * hidden_size,
102
  hidden_act='gelu',
103
+ use_cache=True,
104
+ truncation=False
105
  )
106
  model = GPT2LMHeadModel(config)
107
  logging.info("GPT2LMHeadModel initialized successfully.")