Spaces:
Sleeping
Sleeping
| import streamlit as st | |
| import requests | |
| from transformers import pipeline, BertTokenizer | |
| # Function to generate answers using the BERT model | |
| def generate_answers(chunks, question): | |
| # Initialize the BERT tokenizer | |
| tokenizer = BertTokenizer.from_pretrained("bert-large-uncased-whole-word-masking-finetuned-squad") | |
| # Initialize the question-answering pipeline | |
| model = pipeline("question-answering", model="bert-large-uncased-whole-word-masking-finetuned-squad") | |
| # Concatenate chunks into a single text | |
| paper_text = ' '.join(chunks) | |
| # Generate answers for the question based on the entire context | |
| answer = model(question, paper_text) | |
| return answer['answer'] | |
| # Streamlit app | |
| st.title("Research Paper Question Answering") | |
| paper_link = st.text_input("Enter the link to the research paper (Arxiv link):") | |
| question = st.text_input("Enter your question:") | |
| if st.button("Generate Answer"): | |
| if not (paper_link and question): | |
| st.warning("Please provide both the paper link and the question.") | |
| else: | |
| # Download the research paper | |
| response = requests.get(paper_link) | |
| paper_text = response.text | |
| # Split the paper text into chunks of 512 words | |
| paper_chunks = [paper_text[i:i+512] for i in range(0, len(paper_text), 512)] | |
| # Generate answer based on chunks | |
| answer = generate_answers(paper_chunks, question) | |
| st.success("Answer generated successfully!") | |
| st.text("Generated Answer:") | |
| st.write(answer) | |