Spaces:

alexue4
/

alexue4-text-normalization-ru-new

Sleeping

alexue4 committed on Jul 10, 2024

Commit

1c903eb

verified ·

1 Parent(s): 5e13b07

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,29 +1,38 @@
 import gradio as gr
-# Load the pre-built interface
-interface = gr.load("models/alexue4/text-normalization-ru-new")
-# Function to modify the behavior (example: limiting max tokens and setting examples)
 def custom_function(input_text):
-    # Custom processing here (e.g., limit max tokens)
-    max_tokens = 250  # Set your desired max token limit
-    if len(input_text.split()) > max_tokens:
-        input_text = ' '.join(input_text.split()[:max_tokens])
-    # Call the original function from the interface
-    original_output = interface.predict(input_text)
-    return original_output
-# Customize the examples
 examples = [
     ["в 2006-2010 гг. Вася учился в МГУ"],
     ["я купил iphone 10X за 14990 руб без 3-x часов полдень и т.д."]
 ]
-# Define the new Gradio interface with custom function and examples
-gr.Interface(
     fn=custom_function,
     inputs="text",
     outputs="text",
     examples=examples
-).launch()

 import gradio as gr
+import transformers
+# Load the model
+model_name = "alexue4/text-normalization-ru-new"
+model = transformers.AutoModelForSequenceClassification.from_pretrained(model_name)
+tokenizer = transformers.AutoTokenizer.from_pretrained(model_name)
+# Define the custom function
 def custom_function(input_text):
+    max_tokens = 100  # Set your desired max token limit
+    tokens = tokenizer.tokenize(input_text)
+    if len(tokens) > max_tokens:
+        tokens = tokens[:max_tokens]
+        input_text = tokenizer.convert_tokens_to_string(tokens)
+    inputs = tokenizer(input_text, return_tensors="pt")
+    outputs = model(**inputs)
+    prediction = outputs.logits.argmax(dim=-1).item()
+    return prediction
 examples = [
     ["в 2006-2010 гг. Вася учился в МГУ"],
     ["я купил iphone 10X за 14990 руб без 3-x часов полдень и т.д."]
 ]
+interface = gr.Interface(
     fn=custom_function,
     inputs="text",
     outputs="text",
     examples=examples
+)
+# Launch the interface
+interface.launch()