Spaces:
Running
Running
Refactor paper_data and summarize_paper functions for improved parameter handling and clarity
adbfd57
import os | |
import html | |
import re | |
import time | |
import requests | |
import dotenv | |
import mistune | |
from image import fetch_image | |
dotenv.load_dotenv() | |
access_key = os.getenv('ACCESS_KEY') | |
client_id = os.getenv('CLIENT_ID') | |
client_secret = os.getenv('CLIENT_SECRET') | |
refresh_token = os.getenv('REFRESH_TOKEN') | |
blog_id = os.getenv('BLOG_ID') | |
imgbb_api_key = os.getenv('IMGBB_API_KEY') | |
def generate_post_html(doi, title, category, summary, mindmap, citation): | |
doi = doi.split("https://")[-1] | |
title = title.replace("{", r'{').replace("}", r'}') | |
title = re.sub(r"\\(?![a-zA-Z])", r"", title) | |
summary = summary.replace("{", r'{').replace("}", r'}') | |
mindmap = mindmap.replace("{", r'{').replace("}", r'}') | |
citation = citation.replace("{", r'{').replace("}", r'}') | |
citation = mistune.html(citation.replace("&", "&").strip()) | |
image = fetch_image(title, summary, imgbb_api_key) | |
html_summary = mistune.html(summary) | |
post = f""" | |
<div id="paper_post"> | |
<img style="display:block; width:100%; height:100%;" id="paper_image" | |
src="{image.strip()}" | |
alt="{title.strip()}"> | |
<br> | |
<br> | |
<div id="paper_summary"> | |
{html_summary.replace("&", "&").strip()} | |
</div> | |
<br> | |
<h2>Mindmap</h2> | |
<p><small><em>If MindMap doesn't load, go to the <a href="/">Homepage</a> and visit blog again or <a | |
href="/#">Switch to Android App (Under Development)</a>.</em></small></p> | |
<div class="markmap" id="paper_mindmap"> | |
<script type="text/template"> | |
{mindmap.replace("&", "&").replace(":", "=>").strip()} | |
</script> | |
</div> | |
<br> | |
<h2>Citation</h2> | |
<div id="paper_citation"> | |
{mistune.html(citation.replace("&", "&").strip())} | |
</div> | |
<script> | |
const paperImage = document.querySelector( | |
'img[style="display:block; width:100%; height:100%;"][id="paper_image"]' | |
); | |
if (paperImage) {{ | |
const tablOfContents = document.createElement("div"); | |
tablOfContents.innerHTML = "<b>{{getToc}} $title={{Table of Contents}}</b>"; | |
const brElement = paperImage.nextElementSibling; | |
if (brElement && brElement.tagName === "BR") {{ | |
brElement.insertAdjacentElement("afterend", tablOfContents); | |
}} | |
}} | |
</script> | |
<script> | |
window.markmap = {{ | |
autoLoader: {{ | |
toolbar: true, | |
}}, | |
}}; | |
</script> | |
<script src="https://cdn.jsdelivr.net/npm/markmap-autoloader@latest"></script> | |
<script> | |
window.addEventListener('load', function() {{ | |
setTimeout(function() {{ | |
const element = document.querySelector('div.mm-toolbar-item[title="Fit window size"]'); | |
console.log(element); | |
if (element) {{ | |
element.click(); | |
}} else {{ | |
console.log('Element not found'); | |
}} | |
}}, 0); | |
}}); | |
</script> | |
<style> | |
.markmap {{ | |
position: relative; | |
}} | |
.markmap > svg {{ | |
width: 100%; | |
border: 2px solid #000; | |
height: 80dvh; | |
}} | |
</style> | |
<script> | |
window.addEventListener('load', function() {{ | |
const anchor = document.querySelector('a.mm-toolbar-brand'); | |
if (anchor) {{ | |
anchor.href = '/'; | |
const img = anchor.querySelector('img'); | |
if (img) {{ | |
img.src = ''; | |
img.alt = 'ReXplore'; | |
}} | |
const span = anchor.querySelector('span'); | |
if (span) {{ | |
span.textContent = 'ReXplore'; | |
}} | |
}} else {{ | |
console.log('Anchor element not found'); | |
}} | |
}}); | |
</script> | |
</div> | |
""" | |
return post, image | |
def create_post(doi, title, category, summary, mindmap, citation): | |
post_title = title | |
post_category = f"{category}" | |
try: | |
post_body, post_image = generate_post_html(doi, title, category, summary, mindmap, citation) | |
# with open('post.html', 'w') as f: | |
# f.write(post_body) | |
# exit(code=0) | |
except Exception as e: | |
print(f"Error generating post: {e}") | |
return None, None, None, None | |
return post_title, post_category, post_body, post_image | |
def post_post(title, category, body, image): | |
title = re.sub(r"\\(?![a-zA-Z])", r"", title) | |
response = None | |
try: | |
data = requests.post( | |
url='https://oauth2.googleapis.com/token', | |
data={ | |
'grant_type': 'refresh_token', | |
'client_secret': client_secret, | |
'refresh_token': refresh_token, | |
'client_id': client_id, | |
}, | |
).json() | |
url = f"https://blogger.googleapis.com/v3/blogs/{blog_id}/posts" | |
headers = { | |
'Authorization': f"Bearer {data['access_token']}", | |
"content-type": "application/json" | |
} | |
post_data = { | |
"kind": "blogger#post", | |
"blog": { | |
"id": blog_id | |
}, | |
"images": [{ | |
"url": image | |
}], | |
"title": title, | |
"content": body, | |
"labels": [category, "ZZZZZZZZZ"] | |
} | |
response = requests.post(url, headers=headers, json=post_data).json() | |
if response['status'] != 'LIVE': | |
print(response) | |
if response['status'] == 'LIVE': | |
print(f"The post '{title}' is {response['status']}") | |
return True | |
else: | |
print(response) | |
print(f"Error posting {title}: {response}") | |
return False | |
except Exception as e: | |
print(response) | |
print(f"Error posting {title}: {e}") | |
return False | |
def post_blog(doi, title, category, summary, mindmap, citation, uaccess_key, wait_time=5): | |
if uaccess_key != access_key: | |
return False | |
else: | |
status = True | |
post_title, post_category, post_body, post_image = create_post(doi, title, category, summary, mindmap, citation) | |
if not all([post_title, post_category, post_body, post_image]): | |
print(f'Failed to create post {post_title}') | |
return False | |
post_title = post_title.replace("&", "&") | |
if "&" in post_title: | |
return False | |
status = post_post(post_title, post_category, post_body, post_image) | |
print(f"Waiting for {wait_time*60} seconds...") | |
time.sleep(wait_time*60) | |
if status: | |
print('Post created successfully') | |
return True | |
else: | |
print('Failed to create post') | |
return False | |