pragnakalp committed on
Commit
207d8a5
·
1 Parent(s): 849b6e1

added code for logs save

Browse files
Files changed (1) hide show
  1. app.py +35 -3
app.py CHANGED
@@ -3,13 +3,37 @@ import requests
3
  import os
4
  import numpy as np
5
  import pandas as pd
6
- import io
7
- import os
8
  # from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, AutoModelForSequenceClassification
9
  from questiongenerator import QuestionGenerator
10
 
11
  qg = QuestionGenerator()
12
- # num_que = 5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
 
14
  def generate_questions(article,num_que):
15
  result = ''
@@ -23,9 +47,17 @@ def generate_questions(article,num_que):
23
  "generated_questions" : generated_questions_list
24
  }
25
  generated_questions = summarized_data.get("generated_questions",'')
 
 
 
 
 
 
 
26
  for q in generated_questions:
27
  print(q)
28
  result = result + q + '\n'
 
29
  return result
30
 
31
  ## design 1
 
3
  import os
4
  import numpy as np
5
  import pandas as pd
6
+ =import json
 
7
  # from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, AutoModelForSequenceClassification
8
  from questiongenerator import QuestionGenerator
9
 
10
  qg = QuestionGenerator()
11
+
12
+ HF_TOKEN = os.environ.get("HF_TOKEN")
13
+ DATASET_NAME = "Question_Generation_T5"
14
+ DATASET_REPO_URL = f"https://huggingface.co/datasets/pragnakalp/{DATASET_NAME}"
15
+ DATA_FILENAME = "que_gen_logs.json"
16
+ DATA_FILE = os.path.join("que_gen_logs", DATA_FILENAME)
17
+ DATASET_REPO_ID = "pragnakalp/Question_Generation_T5"
18
+ print("is none?", HF_TOKEN is None)
19
+ # REPOSITORY_DIR = "data"
20
+ # LOCAL_DIR = 'data_local'
21
+ # os.makedirs(LOCAL_DIR,exist_ok=True)
22
+
23
+ try:
24
+ hf_hub_download(
25
+ repo_id=DATASET_REPO_ID,
26
+ filename=DATA_FILENAME,
27
+ cache_dir=DATA_DIRNAME,
28
+ force_filename=DATA_FILENAME
29
+ )
30
+
31
+ except:
32
+ print("file not found")
33
+
34
+ repo = Repository(
35
+ local_dir="que_gen_logs", clone_from=DATASET_REPO_URL, use_auth_token=HF_TOKEN
36
+ )
37
 
38
  def generate_questions(article,num_que):
39
  result = ''
 
47
  "generated_questions" : generated_questions_list
48
  }
49
  generated_questions = summarized_data.get("generated_questions",'')
50
+ entry = {"article": article, "generated_questions": generated_questions, "num_of_question": num_que}
51
+ with open(DATA_FILE, "r") as file:
52
+ data = json.load(file)
53
+ data.append(entry)
54
+ with open(DATA_FILE, "w") as file:
55
+ json.dump(data, file)
56
+ commit_url = repo.push_to_hub()
57
  for q in generated_questions:
58
  print(q)
59
  result = result + q + '\n'
60
+
61
  return result
62
 
63
  ## design 1