Spaces:

polygraf-ai
/

copyright_checker

Runtime error

eljanmahammadli committed on Feb 23, 2024

Commit

2d19a26

1 Parent(s): 4302b12

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -188,7 +188,7 @@ text_bc_model_path = "polygraf-ai/v3-bert-3-2m-trun-bc-lighter-spec"
 text_bc_tokenizer = AutoTokenizer.from_pretrained(text_bc_model_path)
 text_bc_model = AutoModelForSequenceClassification.from_pretrained(text_bc_model_path).to(device)
-text_mc_model_path = "polygraf-ai/ai-text-detection-mc-robert-open-ai-detector-v4"
 text_mc_tokenizer = AutoTokenizer.from_pretrained(text_mc_model_path)
 text_mc_model = AutoModelForSequenceClassification.from_pretrained(text_mc_model_path).to(device)
@@ -213,7 +213,7 @@ def update_character_count(text):
     return f"{len(text)} characters"
-def split_text_allow_complete_sentences_nltk(text, max_length=256, tolerance=40, min_last_segment_length=150, type_det = 'bc'):
     sentences = nltk.sent_tokenize(text)
     segments = []
     current_segment = []

 text_bc_tokenizer = AutoTokenizer.from_pretrained(text_bc_model_path)
 text_bc_model = AutoModelForSequenceClassification.from_pretrained(text_bc_model_path).to(device)
+text_mc_model_path = "polygraf-ai/text-detect-mc-bert-base-uncased-mistral-openai-447k-256"
 text_mc_tokenizer = AutoTokenizer.from_pretrained(text_mc_model_path)
 text_mc_model = AutoModelForSequenceClassification.from_pretrained(text_mc_model_path).to(device)
     return f"{len(text)} characters"
+def split_text_allow_complete_sentences_nltk(text, max_length=256, tolerance=40, min_last_segment_length=150, type_det='bc'):
     sentences = nltk.sent_tokenize(text)
     segments = []
     current_segment = []