Commit
·
207d8a5
1
Parent(s):
849b6e1
Added code for saving logs
Browse files
app.py
CHANGED
|
@@ -3,13 +3,37 @@ import requests
|
|
| 3 |
import os
|
| 4 |
import numpy as np
|
| 5 |
import pandas as pd
|
| 6 |
-
import
|
| 7 |
-
import os
|
| 8 |
# from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, AutoModelForSequenceClassification
|
| 9 |
from questiongenerator import QuestionGenerator
|
| 10 |
|
| 11 |
qg = QuestionGenerator()
|
| 12 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 13 |
|
| 14 |
def generate_questions(article,num_que):
|
| 15 |
result = ''
|
|
@@ -23,9 +47,17 @@ def generate_questions(article,num_que):
|
|
| 23 |
"generated_questions" : generated_questions_list
|
| 24 |
}
|
| 25 |
generated_questions = summarized_data.get("generated_questions",'')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 26 |
for q in generated_questions:
|
| 27 |
print(q)
|
| 28 |
result = result + q + '\n'
|
|
|
|
| 29 |
return result
|
| 30 |
|
| 31 |
## design 1
|
|
|
|
| 3 |
import os
|
| 4 |
import numpy as np
|
| 5 |
import pandas as pd
|
| 6 |
+
import json
|
|
|
|
| 7 |
# from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, AutoModelForSequenceClassification
|
| 8 |
from questiongenerator import QuestionGenerator
|
| 9 |
|
| 10 |
qg = QuestionGenerator()
|
| 11 |
+
|
| 12 |
+
HF_TOKEN = os.environ.get("HF_TOKEN")
|
| 13 |
+
DATASET_NAME = "Question_Generation_T5"
|
| 14 |
+
DATASET_REPO_URL = f"https://huggingface.co/datasets/pragnakalp/{DATASET_NAME}"
|
| 15 |
+
DATA_FILENAME = "que_gen_logs.json"
|
| 16 |
+
DATA_FILE = os.path.join("que_gen_logs", DATA_FILENAME)
|
| 17 |
+
DATASET_REPO_ID = "pragnakalp/Question_Generation_T5"
|
| 18 |
+
print("is none?", HF_TOKEN is None)
|
| 19 |
+
# REPOSITORY_DIR = "data"
|
| 20 |
+
# LOCAL_DIR = 'data_local'
|
| 21 |
+
# os.makedirs(LOCAL_DIR,exist_ok=True)
|
| 22 |
+
|
| 23 |
+
try:
|
| 24 |
+
hf_hub_download(
|
| 25 |
+
repo_id=DATASET_REPO_ID,
|
| 26 |
+
filename=DATA_FILENAME,
|
| 27 |
+
cache_dir=DATA_DIRNAME,
|
| 28 |
+
force_filename=DATA_FILENAME
|
| 29 |
+
)
|
| 30 |
+
|
| 31 |
+
except:
|
| 32 |
+
print("file not found")
|
| 33 |
+
|
| 34 |
+
repo = Repository(
|
| 35 |
+
local_dir="que_gen_logs", clone_from=DATASET_REPO_URL, use_auth_token=HF_TOKEN
|
| 36 |
+
)
|
| 37 |
|
| 38 |
def generate_questions(article,num_que):
|
| 39 |
result = ''
|
|
|
|
| 47 |
"generated_questions" : generated_questions_list
|
| 48 |
}
|
| 49 |
generated_questions = summarized_data.get("generated_questions",'')
|
| 50 |
+
entry = {"article": article, "generated_questions": generated_questions, "num_of_question": num_que}
|
| 51 |
+
with open(DATA_FILE, "r") as file:
|
| 52 |
+
data = json.load(file)
|
| 53 |
+
data.append(entry)
|
| 54 |
+
with open(DATA_FILE, "w") as file:
|
| 55 |
+
json.dump(data, file)
|
| 56 |
+
commit_url = repo.push_to_hub()
|
| 57 |
for q in generated_questions:
|
| 58 |
print(q)
|
| 59 |
result = result + q + '\n'
|
| 60 |
+
|
| 61 |
return result
|
| 62 |
|
| 63 |
## design 1
|