Commit
·
207d8a5
1
Parent(s):
849b6e1
added code for logs save
Browse files
app.py
CHANGED
@@ -3,13 +3,37 @@ import requests
|
|
3 |
import os
|
4 |
import numpy as np
|
5 |
import pandas as pd
|
6 |
-
import
|
7 |
-
import os
|
8 |
# from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, AutoModelForSequenceClassification
|
9 |
from questiongenerator import QuestionGenerator
|
10 |
|
11 |
qg = QuestionGenerator()
|
12 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
13 |
|
14 |
def generate_questions(article,num_que):
|
15 |
result = ''
|
@@ -23,9 +47,17 @@ def generate_questions(article,num_que):
|
|
23 |
"generated_questions" : generated_questions_list
|
24 |
}
|
25 |
generated_questions = summarized_data.get("generated_questions",'')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
26 |
for q in generated_questions:
|
27 |
print(q)
|
28 |
result = result + q + '\n'
|
|
|
29 |
return result
|
30 |
|
31 |
## design 1
|
|
|
3 |
import os
|
4 |
import numpy as np
|
5 |
import pandas as pd
|
6 |
+
import json
|
|
|
7 |
# from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, AutoModelForSequenceClassification
|
8 |
from questiongenerator import QuestionGenerator
|
9 |
|
10 |
qg = QuestionGenerator()
|
11 |
+
|
12 |
+
HF_TOKEN = os.environ.get("HF_TOKEN")
|
13 |
+
DATASET_NAME = "Question_Generation_T5"
|
14 |
+
DATASET_REPO_URL = f"https://huggingface.co/datasets/pragnakalp/{DATASET_NAME}"
|
15 |
+
DATA_FILENAME = "que_gen_logs.json"
|
16 |
+
DATA_FILE = os.path.join("que_gen_logs", DATA_FILENAME)
|
17 |
+
DATASET_REPO_ID = "pragnakalp/Question_Generation_T5"
|
18 |
+
print("is none?", HF_TOKEN is None)
|
19 |
+
# REPOSITORY_DIR = "data"
|
20 |
+
# LOCAL_DIR = 'data_local'
|
21 |
+
# os.makedirs(LOCAL_DIR,exist_ok=True)
|
22 |
+
|
23 |
+
try:
|
24 |
+
hf_hub_download(
|
25 |
+
repo_id=DATASET_REPO_ID,
|
26 |
+
filename=DATA_FILENAME,
|
27 |
+
cache_dir=DATA_DIRNAME,
|
28 |
+
force_filename=DATA_FILENAME
|
29 |
+
)
|
30 |
+
|
31 |
+
except:
|
32 |
+
print("file not found")
|
33 |
+
|
34 |
+
repo = Repository(
|
35 |
+
local_dir="que_gen_logs", clone_from=DATASET_REPO_URL, use_auth_token=HF_TOKEN
|
36 |
+
)
|
37 |
|
38 |
def generate_questions(article,num_que):
|
39 |
result = ''
|
|
|
47 |
"generated_questions" : generated_questions_list
|
48 |
}
|
49 |
generated_questions = summarized_data.get("generated_questions",'')
|
50 |
+
entry = {"article": article, "generated_questions": generated_questions, "num_of_question": num_que}
|
51 |
+
with open(DATA_FILE, "r") as file:
|
52 |
+
data = json.load(file)
|
53 |
+
data.append(entry)
|
54 |
+
with open(DATA_FILE, "w") as file:
|
55 |
+
json.dump(data, file)
|
56 |
+
commit_url = repo.push_to_hub()
|
57 |
for q in generated_questions:
|
58 |
print(q)
|
59 |
result = result + q + '\n'
|
60 |
+
|
61 |
return result
|
62 |
|
63 |
## design 1
|