eljanmahammadli committed on
Commit
7c28462
1 Parent(s): a00beed

integrated isotonic regression calibration into the bc model

Browse files
Files changed (1) hide show
  1. predictors.py +11 -7
predictors.py CHANGED
@@ -269,19 +269,23 @@ def predict_bc_scores(input):
269
  samples_len_bc = len(split_text_allow_complete_sentences_nltk(input, type_det="bc"))
270
  segments_bc = split_text_allow_complete_sentences_nltk(input, type_det="bc")
271
  for i in range(samples_len_bc):
272
- cleaned_text_bc = remove_special_characters(segments_bc[i])
 
 
 
 
 
273
  bc_score = predict_bc(text_bc_model, text_bc_tokenizer, cleaned_text_bc)
274
  bc_scores.append(bc_score)
275
  bc_scores_array = np.array(bc_scores)
276
  average_bc_scores = np.mean(bc_scores_array, axis=0)
277
  bc_score_list = average_bc_scores.tolist()
278
- bc_score = {"AI": bc_score_list[1], "HUMAN": bc_score_list[0]}
279
- # print(f"Original BC scores: AI: {bc_score_list[1]}, HUMAN: {bc_score_list[0]}")
280
  # isotonic regression calibration
281
- # ai_score = iso_reg.predict([bc_score_list[1]])[0]
282
- # human_score = 1 - ai_score
283
- # bc_score = {"AI": ai_score, "HUMAN": human_score}
284
- # print(f"Calibration BC scores: AI: {ai_score}, HUMAN: {human_score}")
285
  return bc_score
286
 
287
 
 
269
  samples_len_bc = len(split_text_allow_complete_sentences_nltk(input, type_det="bc"))
270
  segments_bc = split_text_allow_complete_sentences_nltk(input, type_det="bc")
271
  for i in range(samples_len_bc):
272
+
273
+ cleaned_text_bc = (
274
+ segments_bc[i].replace("<s>", "").replace("</s>", "")
275
+ ) # this is caused by above
276
+
277
+ cleaned_text_bc = remove_special_characters(cleaned_text_bc)
278
  bc_score = predict_bc(text_bc_model, text_bc_tokenizer, cleaned_text_bc)
279
  bc_scores.append(bc_score)
280
  bc_scores_array = np.array(bc_scores)
281
  average_bc_scores = np.mean(bc_scores_array, axis=0)
282
  bc_score_list = average_bc_scores.tolist()
283
+ print(f"Original BC scores: AI: {bc_score_list[1]}, HUMAN: {bc_score_list[0]}")
 
284
  # isotonic regression calibration
285
+ ai_score = iso_reg.predict([bc_score_list[1]])[0]
286
+ human_score = 1 - ai_score
287
+ bc_score = {"AI": ai_score, "HUMAN": human_score}
288
+ print(f"Calibration BC scores: AI: {ai_score}, HUMAN: {human_score}")
289
  return bc_score
290
 
291