-
Notifications
You must be signed in to change notification settings - Fork 0
/
summarize_arxiv_paper.py
26 lines (19 loc) · 1.12 KB
/
summarize_arxiv_paper.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
import os
from utils.pdf_helper.read_pdf_from_local import read_pdf_exclude_pages
from utils.pdf_helper.get_pdf_from_arxiv import read_pdf_from_url
from utils.pdf_helper.pdf_summary_report_writer import create_or_append_pdf
from utils.transformers.openai_summarizer import openAI_summarizer_wrapper
def summarize_local_pdf_using_openai(input_file, output_file, pages_to_exclude):
input_file_content = read_pdf_exclude_pages(input_file, pages_to_exclude)
summarized_report = openAI_summarizer_wrapper(input_file_content)
print(summarized_report)
create_or_append_pdf(output_file, summarized_report)
return
base_input_path = "paper_pdf_repo/research_papers/"
base_output_path = "paper_pdf_repo/summaries/"
input_filename = "A_Survey_on_Evaluation_of_Large_Language_Models.pdf"
output_filename = "A_Survey_on_Evaluation_of_Large_Language_Models_Summary.pdf"
input_file = os.path.join(base_input_path, input_filename)
output_file = os.path.join(base_output_path, output_filename)
pages_to_exclude = [34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45]
summarize_local_pdf_using_openai(input_file, output_file, pages_to_exclude)