forked from OrIdow6/cohost-grab
-
Notifications
You must be signed in to change notification settings - Fork 0
/
grab-script-checks
289 lines (224 loc) · 20.5 KB
/
grab-script-checks
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
format 0
[[]]
not regex .*view-source:.*
not discoveredregex .*iframe\\.?ly.*
successful
[user:sanqui]
some exact https://cohost.org/sanqui
some exact https://staging.cohostcdn.org/header/44212-ce22451d-922d-4dfa-8c4d-74cd8ae99b53-profile.png
some exact https://staging.cohostcdn.org/avatar/44212-f0523470-dd28-4357-9cb9-91b51ce26a66-profile.png?dpr=2&width=80&height=80&fit=cover&auto=webp # TODO assert that avatar images like this are always requested with width and height of 80, since that is how they are fetched for users other than the current one (even when downscaled client-side)
some exact https://cohost.org/sanqui?page=0
not exact https://cohost.org/sanqui?page=1
# Unclear purpose
some exact https://cohost.org/api/v1/trpc/users.displayPrefs,subscriptions.hasActiveSubscription,login.loggedIn,projects.followingState,posts.profilePosts,projects.isReaderMuting,projects.isReaderBlocking?batch=1&input=%7B%223%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%224%22%3A%7B%22projectHandle%22%3A%22sanqui%22%2C%22page%22%3A0%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Afalse%2C%22hideAsks%22%3Afalse%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%2C%225%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%226%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%7D
# TODO check if this is for any page but 0
some exact https://cohost.org/api/v1/trpc/posts.profilePosts?batch=1&input=%7B%220%22%3A%7B%22projectHandle%22%3A%22sanqui%22%2C%22page%22%3A0%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Afalse%2C%22hideAsks%22%3Afalse%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%7D
# Useless to us (possibly to check if a login has happened in another tab?), but required for playback
some exact https://cohost.org/api/v1/trpc/login.loggedIn,users.displayPrefs,subscriptions.hasActiveSubscription,projects.isReaderMuting,projects.isReaderBlocking,projects.followingState,posts.profilePosts?batch=1&input=%7B%223%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%224%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%225%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%226%22%3A%7B%22projectHandle%22%3A%22sanqui%22%2C%22page%22%3A0%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Afalse%2C%22hideAsks%22%3Afalse%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%7D
some exact https://cohost.org/api/v1/trpc/login.loggedIn,users.displayPrefs,subscriptions.hasActiveSubscription,projects.isReaderMuting,projects.isReaderBlocking,projects.followingState,posts.profilePosts?batch=1&input=%7B%223%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%224%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%225%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%226%22%3A%7B%22projectHandle%22%3A%22sanqui%22%2C%22page%22%3A0%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Atrue%2C%22hideAsks%22%3Atrue%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%7D
# XHR that gets requested on a post
some exact https://cohost.org/api/v1/trpc/users.displayPrefs,subscriptions.hasActiveSubscription,login.loggedIn,projects.followingState,posts.singlePost,projects.isReaderMuting,projects.isReaderBlocking?batch=1&input=%7B%223%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%224%22%3A%7B%22handle%22%3A%22sanqui%22%2C%22postId%22%3A1697007%7D%2C%225%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%226%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%7D
some exact https://cohost.org/api/v1/trpc/login.loggedIn,users.displayPrefs,subscriptions.hasActiveSubscription,projects.isReaderMuting,projects.isReaderBlocking,projects.followingState,posts.singlePost?batch=1&input=%7B%223%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%224%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%225%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%226%22%3A%7B%22handle%22%3A%22sanqui%22%2C%22postId%22%3A1697007%7D%7D
# Site logos
not exact https://cohost.org/static/7ec6f0f3aef87d734f9b.png
not exact https://cohost.org/static/3c154cde88b7ed1ca92a.png
# Post which is purely a repost of another; may eliminate these if we are pressured
# N.b. the tags and first user discovered (the original poster) are still discernable from the main blog page
some exact https://cohost.org/sanqui/post/7345235-empty
some discovered tag:pok%c3%a9mon%20diamond%20but%20not%20the%20one%20from%20game%20freak
some discovered user:telefang
some discovered user:Maverynthia
some discovered https://sanqui.net/etc/telefang_screenshots.png # Post was from another user (despite the domain name) but we can pipe it to #// even though that means a bit of duplication over there
# Another image not posted by this user (not external domain)
# Disabled: we now fetch these, because I'm not 100% confident the repost detection won't give false positives
# not regex ^https?://staging\.cohostcdn\.org/attachment/08dfeaa1-9a85-4679-b2f7-744d4609fd92/sanqui\.jpg.*
some discovered usertag:sanqui/english%20translation%20patch
not exact https://cohost.org/sanqui/tagged/english%20translation%20patch
some exact https://cohost.org/sanqui/post/6020724-owl-and-a-crt
not exact https://cohost.org/sanqui/tagged/look%20at%20me%20practicing%20POSSE
some discovered usertag:sanqui/look%20at%20me%20practicing%20POSSE
some discovered tag:look%20at%20me%20practicing%20POSSE
# Ask
some exact https://cohost.org/sanqui/post/2210422-ovo
# Image that was posted by this user
some exact https://staging.cohostcdn.org/attachment/4a953630-0e22-401a-aecc-ef5004bdf248/onix_border_8x_wide.png?width=675&auto=webp&dpr=1
some exact https://staging.cohostcdn.org/attachment/4a953630-0e22-401a-aecc-ef5004bdf248/onix_border_8x_wide.png?width=675&auto=webp&dpr=2
some exact https://staging.cohostcdn.org/attachment/4a953630-0e22-401a-aecc-ef5004bdf248/onix_border_8x_wide.png?width=675&auto=webp&dpr=3
some exact https://staging.cohostcdn.org/attachment/4a953630-0e22-401a-aecc-ef5004bdf248/onix_border_8x_wide.png
# External image embedded in post
some exact https://sanqui.net/etc/ocean-journey-3d.jpg
# External URL
some discovered https://www.digimindsoft.com/Ocean-Journey-3D-Screensaver-57.html
# And in profile
some discovered https://sanqui.net/
# User only mentioned with "@" in profile
some discovered user:tcrf
# Subdomain
some exact https://sanqui.cohost.org/
some exact https://sanqui.cohost.org/?page=0
# some exact https://sanqui.cohost.org/?page=1&hideReplies=true&hideAsks=true Disabled because there are *none* of these, subdomain or not, in cdx
some exact https://sanqui.cohost.org/static/client.9de493d3ba74abc6eacb.css
some regex ^https://sanqui\.cohost\.org/static/runtime\.[a-f0-9]+\.js$
some regex ^https://sanqui\.cohost\.org/static/client\.[a-f0-9]+\.js$
some exact https://sanqui.cohost.org/static/8196.9488211cfaad004027c2.js
some exact https://sanqui.cohost.org/static/client-preact-components-pages-project-page-view.63cef228fcf81849ae53.js
some exact https://sanqui.cohost.org/static/7c05f33b4fe5f8132439.woff2
some exact https://sanqui.cohost.org/static/b07ad0e0d01ba4d56c1a.woff2
some exact https://sanqui.cohost.org/static/1d032f03e8c1619c1840.woff
some exact https://sanqui.cohost.org/static/4860.328a8b56d19750b075f1.js
some exact https://sanqui.cohost.org/static/160a2de1e18bbfbce0d6.woff2
# TODO not sure if I got all of these
# And why not
some exact https://cohost.org/sanqui/rss/public.json
some exact https://cohost.org/sanqui/rss/public.atom
# Original image
some exact https://staging.cohostcdn.org/attachment/4a953630-0e22-401a-aecc-ef5004bdf248/onix_border_8x_wide.png
some discovered user:sanqui+1
[user:sanqui+1]
some exact https://sanqui.cohost.org/?page=1
some exact https://cohost.org/api/v1/trpc/posts.profilePosts?batch=1&input=%7B%220%22%3A%7B%22projectHandle%22%3A%22sanqui%22%2C%22page%22%3A1%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Atrue%2C%22hideAsks%22%3Atrue%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%7D
some exact https://cohost.org/api/v1/trpc/posts.profilePosts?batch=1&input=%7B%220%22%3A%7B%22projectHandle%22%3A%22sanqui%22%2C%22page%22%3A1%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Atrue%2C%22hideAsks%22%3Atrue%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%7D
some exact https://cohost.org/api/v1/trpc/users.displayPrefs,posts.profilePosts?batch=1&input=%7B%221%22%3A%7B%22projectHandle%22%3A%22sanqui%22%2C%22page%22%3A1%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Atrue%2C%22hideAsks%22%3Atrue%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%7D
some exact https://cohost.org/api/v1/trpc/posts.profilePosts?batch=1&input=%7B%220%22%3A%7B%22projectHandle%22%3A%22sanqui%22%2C%22page%22%3A1%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Afalse%2C%22hideAsks%22%3Afalse%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%7D
some exact https://cohost.org/api/v1/trpc/login.loggedIn,users.displayPrefs,subscriptions.hasActiveSubscription,projects.isReaderMuting,projects.isReaderBlocking,projects.followingState,posts.profilePosts?batch=1&input=%7B%223%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%224%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%225%22%3A%7B%22projectHandle%22%3A%22sanqui%22%7D%2C%226%22%3A%7B%22projectHandle%22%3A%22sanqui%22%2C%22page%22%3A1%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Afalse%2C%22hideAsks%22%3Afalse%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%7D
# Ambivalent to whether we get subdomain resources
some exact https://cohost.org/sanqui?page=1
[user:Foxhack]
some discovered user:Foxhack+1
not discovered user:Foxhack+2 # As this should only be discovered by +1
some exact https://staging.cohostcdn.org/attachment/619763b8-1412-498e-a7f4-9e9a4ddd0b06/ded2.gif # From page 0
some exact https://cohost.org/Foxhack/post/7803706-screaming-into-the-v
some exact https://cohost.org/api/v1/trpc/login.loggedIn,users.displayPrefs,subscriptions.hasActiveSubscription,projects.isReaderMuting,projects.isReaderBlocking,projects.followingState,posts.singlePost?batch=1&input=%7B%223%22%3A%7B%22projectHandle%22%3A%22Foxhack%22%7D%2C%224%22%3A%7B%22projectHandle%22%3A%22Foxhack%22%7D%2C%225%22%3A%7B%22projectHandle%22%3A%22Foxhack%22%7D%2C%226%22%3A%7B%22handle%22%3A%22Foxhack%22%2C%22postId%22%3A7803664%7D%7D
some exact https://cohost.org/api/v1/trpc/login.loggedIn,users.displayPrefs,subscriptions.hasActiveSubscription,projects.isReaderMuting,projects.isReaderBlocking,projects.followingState,posts.profilePosts?batch=1&input=%7B%223%22%3A%7B%22projectHandle%22%3A%22Foxhack%22%7D%2C%224%22%3A%7B%22projectHandle%22%3A%22Foxhack%22%7D%2C%225%22%3A%7B%22projectHandle%22%3A%22Foxhack%22%7D%2C%226%22%3A%7B%22projectHandle%22%3A%22Foxhack%22%2C%22page%22%3A0%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Afalse%2C%22hideAsks%22%3Afalse%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%7D
[user:Foxhack+2]
some exact https://cohost.org/Foxhack?page=2
# Image on this page but is a pure repost
# Disabled - the + items get the HTML page before the API request, which means they do a DCP before pure_repost_posts is potentially set
# This technically leads to duplication but seeing as we have 6k items left I can't be bothered, few GiB at most and that's probably an overestimate
# not exact https://staging.cohostcdn.org/attachment/17a2d496-3eef-41b7-a26f-1c52983452ae/image.png?width=675&auto=webp&dpr=2
# And back to normal
some exact https://staging.cohostcdn.org/attachment/4bc5f4a7-ac1f-4788-86b8-b1a7fc33ba48/image.png
some discovered https://www.theverge.com/2024/8/12/24219016/valve-deadlock-hands-on-secret-new-game
some exact https://cohost.org/Foxhack/post/7246433-you-know
some exact https://cohost.org/api/v1/trpc/login.loggedIn,users.displayPrefs,subscriptions.hasActiveSubscription,projects.isReaderMuting,projects.isReaderBlocking,projects.followingState,posts.singlePost?batch=1&input=%7B%223%22%3A%7B%22projectHandle%22%3A%22Foxhack%22%7D%2C%224%22%3A%7B%22projectHandle%22%3A%22Foxhack%22%7D%2C%225%22%3A%7B%22projectHandle%22%3A%22Foxhack%22%7D%2C%226%22%3A%7B%22handle%22%3A%22Foxhack%22%2C%22postId%22%3A7246433%7D%7D
some exact https://cohost.org/api/v1/trpc/posts.profilePosts?batch=1&input=%7B%220%22%3A%7B%22projectHandle%22%3A%22Foxhack%22%2C%22page%22%3A2%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Afalse%2C%22hideAsks%22%3Afalse%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%7D
some exact https://staging.cohostcdn.org/attachment/9ad303fb-8200-47cd-bf44-19c3e8ac36e1/image.png?width=675&auto=webp&dpr=2
some discovered usertag:Foxhack/video%20game%20ad
some discovered tag:video%20game%20ad
[user:Foxhack+17]
some exact https://cohost.org/Foxhack?page=17
some exact https://cohost.org/Foxhack/post/658013-so-how-does-this-pla
some exact https://foxhack.cohost.org/?page=17
some discovered user:Foxhack+18
[user:Foxhack+18]
some exact https://cohost.org/Foxhack?page=18
not regex .*/post/.*
not discoveredregex ^user:Foxhack\\+.*
[usertag:luckyplushy/my%20art]
some regex ^https://cohost\\.org/luckyplushy/tagged/my%20art\\?refTimestamp=17\\d+&skipPosts=20
some regex ^https://cohost\\.org/luckyplushy/tagged/my%20art\\?refTimestamp=17\\d+&skipPosts=60
not exact https://staging.cohostcdn.org/attachment/1dcb6916-b7de-4f2e-8702-1c8d55b9a228/20231115_160048.jpg?width=675&auto=webp&dpr=1
# User with no posts
[user:digitaldragons]
some exact https://cohost.org/digitaldragons
some exact https://digitaldragons.cohost.org/
some exact https://cohost.org/digitaldragons?page=0
some exact https://digitaldragons.cohost.org/?page=0
not exact https://cohost.org/digitaldragons?page=1 # Especially as these go on forever
some exact https://cohost.org/api/v1/trpc/login.loggedIn,users.displayPrefs,subscriptions.hasActiveSubscription,projects.isReaderMuting,projects.isReaderBlocking,projects.followingState,posts.profilePosts?batch=1&input=%7B%223%22%3A%7B%22projectHandle%22%3A%22digitaldragons%22%7D%2C%224%22%3A%7B%22projectHandle%22%3A%22digitaldragons%22%7D%2C%225%22%3A%7B%22projectHandle%22%3A%22digitaldragons%22%7D%2C%226%22%3A%7B%22projectHandle%22%3A%22digitaldragons%22%2C%22page%22%3A0%2C%22options%22%3A%7B%22pinnedPostsAtTop%22%3Atrue%2C%22hideReplies%22%3Afalse%2C%22hideShares%22%3Afalse%2C%22hideAsks%22%3Afalse%2C%22viewingOnProjectPage%22%3Atrue%7D%7D%7D
not discovered user:digitaldragons+1
# User with embeds
[user:sixlegendsgame]
not exact https://iframely.net/api/thumbnail?url=https%3A%2F%2Fyoutu.be%2FL0AGUYXU0ag&key=db0b365a626eb72ce8c169cd30f99ac2&maxwidth=960 # Shows when you allow the Youtube URL, but before playing
not discovered https://youtu.be/L0AGUYXU0ag
not exact https://iframely.net/api/thumbnail?url=https%3A%2F%2Fstore.steampowered.com%2Fapp%2F2768130%2F&key=db0b365a626eb72ce8c169cd30f99ac2&maxwidth=960
not discovered https://store.steampowered.com/app/2768130/
not exact https://cdn.iframe.ly/api/iframely?url=https%3a%2f%2fstore%2esteampowered%2ecom%2fapp%2f2768130%2f&key=db0b365a626eb72ce8c169cd30f99ac2&iframe=1&omit_script=1 # This is escaped as the script does it rather than the browser
not exact https://iframely.net/api/iframe?app=1&url=https%3A%2F%2Fstore.steampowered.com%2Fapp%2F2768130%2F&key=db0b365a626eb72ce8c169cd30f99ac2
not exact https://staging.cohostcdn.org/attachment/ed35dcd5-1dca-4f58-b5a5-19e790149329/davinci.png?width=337&height=197&fit=crop&auto=webp&dpr=1
not exact https://staging.cohostcdn.org/attachment/2083ef06-b9ba-422f-80cf-2639cfeed009/Steam.jpg?width=337&height=197&fit=crop&auto=webp&dpr=1
not exact https://staging.cohostcdn.org/attachment/76d8ccfb-d793-4a8a-a934-954a25bd99f9/Final%20Cutscene%20Climax.png?width=337&height=245&fit=crop&auto=webp&dpr=1
not exact https://staging.cohostcdn.org/attachment/1f240eb2-370c-4b26-a056-f10dff54cc72/dragondancelunarnewyear.png
some discovered user:sixlegendsgame+1
[user:sixlegendsgame+1]
some exact https://iframely.net/api/thumbnail?url=https%3A%2F%2Fyoutu.be%2FL0AGUYXU0ag&key=db0b365a626eb72ce8c169cd30f99ac2&maxwidth=960 # Shows when you allow the Youtube URL, but before playing
some discovered https://youtu.be/L0AGUYXU0ag
some discovered user:sixlegendsgame+2
# Not going to get the actual Youtube content - if we want to do that, #// can handle it
# Second embed (same post)
some exact https://iframely.net/api/thumbnail?url=https%3A%2F%2Fstore.steampowered.com%2Fapp%2F2768130%2F&key=db0b365a626eb72ce8c169cd30f99ac2&maxwidth=960
some discovered https://store.steampowered.com/app/2768130/
some exact https://cdn.iframe.ly/api/iframely?url=https%3a%2f%2fstore%2esteampowered%2ecom%2fapp%2f2768130%2f&key=db0b365a626eb72ce8c169cd30f99ac2&iframe=1&omit_script=1 # This is escaped as the script does it rather than the browser
some exact https://iframely.net/api/iframe?app=1&url=https%3A%2F%2Fstore.steampowered.com%2Fapp%2F2768130%2F&key=db0b365a626eb72ce8c169cd30f99ac2
# Half-height images
some exact https://staging.cohostcdn.org/attachment/ed35dcd5-1dca-4f58-b5a5-19e790149329/davinci.png?width=337&height=197&fit=crop&auto=webp&dpr=1
# N.b. the ones below this might be from +1, I haven't checked them
some exact https://staging.cohostcdn.org/attachment/2083ef06-b9ba-422f-80cf-2639cfeed009/Steam.jpg?width=337&height=197&fit=crop&auto=webp&dpr=1
some exact https://staging.cohostcdn.org/attachment/76d8ccfb-d793-4a8a-a934-954a25bd99f9/Final%20Cutscene%20Climax.png?width=337&height=245&fit=crop&auto=webp&dpr=1
# And a full image, just to make sure
some exact https://staging.cohostcdn.org/attachment/1f240eb2-370c-4b26-a056-f10dff54cc72/dragondancelunarnewyear.png
# Invalid user
[user:digitaldragon444]
some exact https://cohost.org/digitaldragon444
maxrequests 3
# User with noncanonical capitalization
[user:sanquI]
some discovered user:sanqui
maxrequests 400
not discovered user:sanquI+1
not discovered user:sanqui+1
# Someone who seems to have tried to break the tag system with punctuation
[user:this-page-will-break-do-not-repost]
some discovered usertag:this-page-will-break-do-not-repost/%3f
some discovered usertag:this-page-will-break-do-not-repost/%2f
not discovered usertag:this-page-will-break-do-not-repost/?
not discovered usertag:this-page-will-break-do-not-repost//
some discovered tag:%3f
some discovered tag:%2f
not discovered tag:?
not discovered tag:/
[usertag:this-page-will-break-do-not-repost/%3f]
some exact https://cohost.org/this-page-will-break-do-not-repost/tagged/%3f
[tag:%2f]
some exact https://cohost.org/rc/tagged/%2f
not discoveredregex tagext:.*
# Post with redirecting media URL in some meta tag
[post:tangledmacrame/post/1307301-empty]
some exact https://cohost.org/api/v1/attachments/92f06b0e-faee-429c-8cf7-f5cc3e2d79e6
some exact https://staging.cohostcdn.org/attachment/92f06b0e-faee-429c-8cf7-f5cc3e2d79e6/BenBois-Vinyl-records.svg
# Post that 404s even though it's listed on a tag page
[post:LeminWedj/post/4049956-no-discrimination]
some exact https://cohost.org/LeminWedj/post/4049956-no-discrimination
# Account content hidden to logged-out users
[user:lazuliterecursion]
some exact https://cohost.org/lazuliterecursion/rss/public.json
# What it looks like
[user:sailorhannibal+4]
not regex .*base64.*
# Embed with no HTML (domain parking page)
[user:decispark+1]
some exact https://cdn.iframe.ly/api/iframely?url=https%3a%2f%2fabout%2elive%2espace%2fpost%2fthank%2dyou&key=db0b365a626eb72ce8c169cd30f99ac2&iframe=1&omit_script=1
# Bluesky handle with the same name as the user but different capitalization - gets read in as a divergence of Cohost caps
[user:RunningDlog]
some exact https://iframely.net/api/iframe?app=1&url=https%3A%2F%2Fbsky.app%2Fprofile%2Frunningdlog.bsky.social&key=db0b365a626eb72ce8c169cd30f99ac2
[tag:video%20game%20preservation]
some exact https://cohost.org/rc/tagged/video%20game%20preservation
some regex ^https?://cohost\\.org/rc/tagged/video%20game%20preservation\\?refTimestamp=17\\d+&skipPosts=40
some discovered user:kaceydotme
some discovered user:witchpixels
not discoveredregex tagext:50/17\\d+/video%20game%20preservation
[tag:furry]
some exact https://cohost.org/rc/tagged/furry
some regex ^https?://cohost\\.org/rc/tagged/furry\\?refTimestamp=17\\d+&skipPosts=40
some regex ^https?://cohost\\.org/rc/tagged/furry\\?refTimestamp=17\\d+&skipPosts=49
not regex ^https?://cohost\\.org/rc/tagged/furry\\?refTimestamp=17\\d+&skipPosts=\\d{4}
some discoveredregex tagext:50/17\\d+/furry
[tag:furby]
some discoveredregex tagext:50/17\\d+/furby
[tagext:50/1731051700701/furby]
some discovered tagext:100/1731051700701/furby # As there is a "next" link on p 99
[tagext:100/1731051700701/furby]
not discoveredregex tagext:.*
# Single quote and exclamation mark get pre-urldecoded by wget
[tag:We%27ll%20see%20if%20that%20helps%21%21]
some regex ^https?://cohost\\.org/.*