"""A sample to send message on Google Chat group with Python requests.
adapted from https://gist.github.com/gh640/4df1cf28bf2e1b8544487213e3fbd4fe
"""
import json
import os
from datetime import datetime

import requests
from requests import Response

from parse_json_to_md import extract_criterion_from_paper

# You need to pass WEBHOOK_URL as an environment variable.
# You can generate a webhook URL in the "Apps & integrations" page of a chat space.
WEBHOOK_URL = os.environ["WEBHOOK_URL"]
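# For local testing you might export a (hypothetical) webhook URL first, e.g.:
#   export WEBHOOK_URL='https://chat.googleapis.com/v1/spaces/AAAA/messages?key=...&token=...'

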
def send_text_card(title: str, paragraphs: list[str]) -> Response:
    """Post a card message to the webhook; each paragraph becomes its own section."""
    header = {"title": title}
    sections = [{"widgets": [{"textParagraph": {"text": p}}]} for p in paragraphs]
    cards = [
        {
            "header": header,
            "sections": sections,
        },
    ]
    return requests.post(WEBHOOK_URL, json={"cards": cards})
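
# A minimal usage sketch, assuming WEBHOOK_URL points at a valid space webhook.
# Google Chat incoming webhooks also accept a plain {"text": "..."} payload;
# the "cards" payload built above is the richer card format:
#
#   resp = send_text_card(
#       "Arxiv update",
#       ["<b>Topic 1: </b>\nPaper one", "<b>Topic 2: </b>\nPaper two"],
#   )
#   resp.raise_for_status()  # surface HTTP errors from the webhook

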
def render_paper(paper_entry: dict) -> str:
    """Render one paper entry as an HTML string for a Google Chat card.

    :param paper_entry: a dict loaded from the output json. A trimmed example
        (abstract shortened; authors shown as plain name strings, as the join
        below requires):
        {"paperId": "2754e70eaa0c2d40972c47c4c23210f0cece8bfc",
         "arxiv_id": "2310.16834",
         "title": "Discrete Diffusion Language Modeling by Estimating the Ratios of the Data Distribution",
         "abstract": "Despite their groundbreaking performance ...",
         "year": 2023,
         "authors": ["Aaron Lou", "Chenlin Meng", "Stefano Ermon"],
         "COMMENT": "The paper shows a significant advance in the performance of diffusion language models, directly meeting one of the criteria.",
         "RELEVANCE": 10,
         "NOVELTY": 8}
    :return: an HTML-formatted string (the linked title on one line, the
        comma-joined author list on the next), suitable for a textParagraph
        widget in a Google Chat card.
    """
# get the arxiv id
arxiv_id = paper_entry["arxiv_id"]
# get the title
    title = paper_entry["title"].replace("&", "&amp;")
# get the arxiv url
arxiv_url = f"https://arxiv.org/abs/{arxiv_id}"
# get the authors
authors = paper_entry["authors"]
paper_string = f"<a href='{arxiv_url}'>{title}</a>\n{', '.join(authors)}"
return paper_string
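
# A worked sketch, assuming the output json stores authors as plain name
# strings (as the join above requires). For an entry like
#   {"arxiv_id": "2310.16834",
#    "title": "Discrete Diffusion Language Modeling ...",
#    "authors": ["Aaron Lou", "Chenlin Meng", "Stefano Ermon"]}
# render_paper returns:
#   "<a href='https://arxiv.org/abs/2310.16834'>Discrete Diffusion Language Modeling ...</a>\n"
#   "Aaron Lou, Chenlin Meng, Stefano Ermon"

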
def group_by_topics(topic_ids, paper_strings):
    """Group rendered papers by topic id; topic 0 ("you might like") is ordered last."""
    topics = [[] for _ in range(max(topic_ids) + 1)]
for topic, paper in zip(topic_ids, paper_strings):
topics[topic].append(paper)
result = []
like = None
for topic, paperlist in enumerate(topics):
if len(paperlist) == 0:
continue
if topic == 0:
like = '<b>GPT thinks you might like: </b>\n' + '\n\n'.join(paperlist)
else:
block_string = f"<b>Topic {topic}: </b>\n" + '\n\n'.join(paperlist)
result.append(block_string)
if like:
result.append(like)
return result
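
# A small worked example of the grouping: topic_ids = [1, 0, 1] with
# paper_strings = ["A", "B", "C"] yields
#   ["<b>Topic 1: </b>\nA\n\nC", "<b>GPT thinks you might like: </b>\nB"]
# because topic 0 is the "you might like" bucket and is always appended last.

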
def push_to_google_chat(papers_dict):
    if len(papers_dict) == 0:
        return
    # classify each paper by the criterion it matched, then render it
    topic_ids = [
        extract_criterion_from_paper(paper) for paper in papers_dict.values()
    ]
    paper_strings = [render_paper(paper) for paper in papers_dict.values()]
paragraphs = group_by_topics(topic_ids, paper_strings)
title = "Arxiv update on " + datetime.today().strftime("%m/%d/%Y")
paragraphs.append("Check <a href='https://variante.github.io/gpt_paper_assistant/'>the web version</a>.")
send_text_card(title, paragraphs)


if __name__ == "__main__":
with open("out/output.json", "r") as f:
output = json.load(f)
push_to_google_chat(output)