Update app.py
Browse files
app.py
CHANGED
@@ -79,6 +79,17 @@ def summarize_paper_and_save_to_sheet(paper_id):
|
|
79 |
worksheet.append_row([paper_id, paper_url, summary, token])
|
80 |
return summary, token
|
81 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
82 |
def gradio_interface():
|
83 |
paper_links = fetch_paper_links("https://huggingface.co/papers")
|
84 |
paper_ids = set(link.split('/')[-1] for link in paper_links)
|
@@ -88,13 +99,13 @@ def gradio_interface():
|
|
88 |
|
89 |
for paper_id in paper_ids:
|
90 |
summary_info = ""
|
91 |
-
|
|
|
92 |
summary, tokens_used = summarize_paper_and_save_to_sheet(paper_id)
|
93 |
total_tokens_used += tokens_used
|
94 |
-
|
95 |
-
|
96 |
-
|
97 |
-
summary_info += f"Error processing paper ID {paper_id}: {e}\n"
|
98 |
|
99 |
summaries.append(summary_info)
|
100 |
|
|
|
79 |
worksheet.append_row([paper_id, paper_url, summary, token])
|
80 |
return summary, token
|
81 |
|
82 |
+
def find_paper_in_sheet(paper_id):
    """Look up a paper in the spreadsheet and return its stored summary.

    Reads every record from the module-level ``worksheet`` and returns the
    ``summary`` value of the first record whose ``ID`` matches ``paper_id``.

    Args:
        paper_id: Identifier of the paper to look for.

    Returns:
        The ``summary`` field of the first matching record, or ``None`` when
        no record matches.

    Raises:
        KeyError: If a record lacks the ``ID`` column, or the matching
            record lacks the ``summary`` column.
    """
    # Compare as text so an ID that the sheet client handed back as a number
    # still matches the string form used by callers.
    # NOTE(review): presumably ``worksheet`` is a gspread Worksheet, whose
    # get_all_records() converts numeric-looking cells by default. IDs ending
    # in zeros (e.g. "2401.10000") would still lose digits in that conversion;
    # consider disabling it via ``numericise_ignore`` -- confirm against the
    # installed client version.
    wanted = str(paper_id)

    for record in worksheet.get_all_records():
        if str(record['ID']) == wanted:
            return record['summary']

    # No matching row was found.
    return None
|
92 |
+
|
93 |
def gradio_interface():
|
94 |
paper_links = fetch_paper_links("https://huggingface.co/papers")
|
95 |
paper_ids = set(link.split('/')[-1] for link in paper_links)
|
|
|
99 |
|
100 |
for paper_id in paper_ids:
|
101 |
summary_info = ""
|
102 |
+
summary = find_paper_in_sheet(paper_id)
|
103 |
+
if summary == None:
|
104 |
summary, tokens_used = summarize_paper_and_save_to_sheet(paper_id)
|
105 |
total_tokens_used += tokens_used
|
106 |
+
|
107 |
+
paper_id_url = f"https://arxiv.org/pdf/{paper_id}.pdf"
|
108 |
+
summary_info += f'論文: {paper_id_url}\n{summary}\n'
|
|
|
109 |
|
110 |
summaries.append(summary_info)
|
111 |
|