numind/NuExtract-v1.5

Text Generation

Model card · Files and versions · Community

Update README.md

#3

by arthrod - opened 13 days ago

base: refs/heads/main

←

from: refs/pr/3

Discussion Files changed

Files changed (1) hide show

README.md +2 -2

README.md CHANGED Viewed

@@ -49,7 +49,7 @@ To use the model:
 import json
 from transformers import AutoModelForCausalLM, AutoTokenizer
-def predict_NuExtract(model, tokenizer, texts, template, batch_size=1, max_length=10_000, max_new_tokens=4_000):
     template = json.dumps(json.loads(template), indent=4)
     prompts = [f"""<|input|>\n### Template:\n{template}\n### Text:\n{text}\n\n<|output|>""" for text in texts]
@@ -104,7 +104,7 @@ Sliding window prompting:
 ```python
 import json
-MAX_INPUT_SIZE = 20_000
 MAX_NEW_TOKENS = 6000
 def clean_json_text(text):

 import json
 from transformers import AutoModelForCausalLM, AutoTokenizer
+def predict_NuExtract(model, tokenizer, texts, template, batch_size=1, max_length=10000, max_new_tokens=4000):
     template = json.dumps(json.loads(template), indent=4)
     prompts = [f"""<|input|>\n### Template:\n{template}\n### Text:\n{text}\n\n<|output|>""" for text in texts]
 ```python
 import json
+MAX_INPUT_SIZE = 20000
 MAX_NEW_TOKENS = 6000
 def clean_json_text(text):