forked from JessicaMulein/duality-social
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathduality-social-lib.ts
269 lines (239 loc) · 7.91 KB
/
duality-social-lib.ts
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
import sanitizeHtml from 'sanitize-html';
import { v4 } from 'uuid';
import {
isValidIconMarkup,
parseIconMarkup,
stripIconMarkup,
} from './font-awesome/font-awesome';
import customFootnote from './markdown-it-footnote-currenturl';
// eslint-disable-next-line @typescript-eslint/no-var-requires
const MarkdownIt = require('markdown-it');
/**
 * markdown-it plugins applied, in array order, to the parser built in parseMarkdown.
 * Each entry's `plugin` is passed to `md.use`; when an `options` value is present it is
 * forwarded as the second argument, otherwise the plugin is registered with no arguments.
 */
const markdownItPlugins = [
{ plugin: require('markdown-it-todo-lists'), options: { enabled: true } },
{ plugin: require('markdown-it-mark') },
{ plugin: require('markdown-it-table-of-contents') },
{ plugin: require('markdown-it-deflist') },
// 'info' is handed to the plugin as its extra `md.use` argument — presumably the
// container name; confirm against the markdown-it-container documentation.
{ plugin: require('markdown-it-container'), options: 'info' },
{ plugin: require('markdown-it-abbr') },
{ plugin: require('markdown-it-footnote') },
// Project-local plugin from ./markdown-it-footnote-currenturl, registered after the
// stock footnote plugin above.
{ plugin: customFootnote },
];
/**
 * Builds a PNG `data:` URL by prefixing the given base64 payload with
 * `data:image/png;base64,`. The payload is not validated or re-encoded.
 * @param imageBase64Json Base64-encoded image bytes (e.g. a `b64_json` value)
 * @returns The payload wrapped as a `data:image/png;base64,...` URL
 */
export function makeDataUrl(imageBase64Json: string): string {
  const pngDataUrlPrefix = 'data:image/png;base64,';
  return pngDataUrlPrefix + imageBase64Json;
}
// /**
// * Given an input image size, return the closest image size our AI can process
// * @param size
// * @returns
// */
// export function closestImageSize(size: number): CreateImageRequestSizeEnum {
// // If size is greater than or equal to 1024, return 1024
// // If size is greater than or equal to 768, return 1024 (round up)
// // If size is greater than or equal to 512, return 512
// // If size is greater than or equal to 256, return 512 (round up)
// // If size is less than 256, return 256
// if (size >= 1024 || (size >= 768 && size < 1024)) {
// return CreateImageRequestSizeEnum._1024x1024;
// } else if (size >= 512 || (size >= 256 && size < 512)) {
// return CreateImageRequestSizeEnum._512x512;
// }
// return CreateImageRequestSizeEnum._256x256;
// }
/**
 * Converts a base64 PNG data URL into a File object.
 *
 * Only URLs starting with `data:image/png;base64,` are accepted. Everything after
 * that prefix is treated as the base64 payload, so a payload containing stray
 * characters (such as an extra comma) is rejected by `atob` instead of being
 * silently truncated.
 * @param imageDataUrl Data URL of the form `data:image/png;base64,<payload>`
 * @param filename Name given to the resulting File (defaults to `image.png`)
 * @returns A File of type `image/png` holding the decoded bytes
 * @throws Error if the URL does not start with the PNG base64 prefix
 * @throws If the payload is not valid base64 (error raised by `atob`)
 */
export function imageDataUrlToFile(
  imageDataUrl: string,
  filename = 'image.png',
): File {
  const pngPrefix = 'data:image/png;base64,';
  if (!imageDataUrl.startsWith(pngPrefix)) {
    throw new Error('Invalid image data URL');
  }
  // Take the whole remainder as the payload; splitting on ',' would drop
  // anything after a second comma without reporting an error.
  const binary = atob(imageDataUrl.slice(pngPrefix.length));
  // atob yields one character per byte (code units 0-255); copy them straight
  // into a typed array rather than through an intermediate number[].
  const bytes = new Uint8Array(binary.length);
  for (let i = 0; i < binary.length; i++) {
    bytes[i] = binary.charCodeAt(i);
  }
  // File accepts the byte array directly, so no intermediate Blob is needed.
  return new File([bytes], filename, { type: 'image/png' });
}
/**
 * Renders a markdown string to HTML using a freshly configured markdown-it
 * instance with every entry of `markdownItPlugins` registered on it.
 *
 * The parser is created with `breaks`, `html`, `linkify`, `typographer` and
 * `xhtmlOut` all enabled.
 * NOTE(review): with `html` enabled, raw HTML in the source is presumably passed
 * through by markdown-it — callers handling untrusted input should sanitize; confirm.
 * @param markdown Markdown source to render
 * @param docId Value exposed to plugins as `env.docId`; a random v4 UUID is used when omitted or empty
 * @param currentUrl Value exposed to plugins as `env.currentUrl`; an empty string is used when omitted or empty
 * @returns The rendered HTML
 */
export function parseMarkdown(
  markdown: string,
  docId?: string,
  currentUrl?: string,
): string {
  const renderer = MarkdownIt('default').set({
    breaks: true,
    html: true,
    linkify: true,
    typographer: true,
    xhtmlOut: true,
  });

  // Register plugins in declaration order, forwarding options only when given.
  for (const { plugin, options } of markdownItPlugins) {
    if (options === undefined) {
      renderer.use(plugin);
    } else {
      renderer.use(plugin, options);
    }
  }

  const renderEnv = {
    docId: docId || v4(),
    currentUrl: currentUrl || '',
  };
  return renderer.render(markdown, renderEnv);
}
/**
 * Turns raw post text into display HTML in three phases:
 * 1. strip every HTML tag and attribute (HTML is not supported in posts, and the
 *    icon syntax is close enough to markdown that it would be parsed as HTML);
 * 2. blog posts are rendered through parseMarkdown, other posts only get their
 *    newlines turned into `<br />`;
 * 3. the custom icon markup is expanded via parseIconMarkup.
 * The result is trimmed of leading/trailing whitespace.
 * @param content Raw post text
 * @param isBlogPost When true the text is rendered as markdown; otherwise only line breaks are converted
 * @param docId Forwarded to parseMarkdown (blog posts only)
 * @param currentUrl Forwarded to parseMarkdown (blog posts only)
 * @returns The rendered, trimmed HTML
 */
export function parsePostContent(
  content: string,
  isBlogPost: boolean,
  docId?: string,
  currentUrl?: string,
): string {
  // Phase 1: remove all HTML
  const tagFree = sanitizeHtml(content, {
    allowedTags: [], // Strip all tags
    allowedAttributes: {}, // Strip all attributes
  });

  // Phase 2: markdown for blog posts, plain line breaks for everything else
  const rendered = isBlogPost
    ? parseMarkdown(tagFree, docId, currentUrl)
    : tagFree.replace(/\n/g, '<br />');

  // Phase 3: expand icon markup, then trim
  return parseIconMarkup(rendered).trim();
}
/**
 * Normalizes post content into the plain text that is used for character counting.
 * Steps, in order:
 * - each `{{...}}` span accepted by isValidIconMarkup becomes a single bullet (`•`);
 *   other `{{...}}` spans are left as typed;
 * - blog posts are rendered through parseMarkdown;
 * - `<br>` / `<br />` tags (plus any whitespace following them) become one newline;
 * - `<a href="...">text</a>` anchors become a bullet followed by the link text;
 * - `<img>` tags carrying an `alt` attribute become the alt text, or a bullet when it is empty;
 * - all remaining HTML tags and attributes are stripped;
 * - CRLF pairs collapse to a single newline and the result is trimmed.
 * @param input Raw post content
 * @param isBlogPost When true the content is rendered as markdown before counting
 * @returns The normalized text
 */
export function prepareContentForCharacterCount(
  input: string,
  isBlogPost: boolean,
): string {
  // Valid icon markup counts as one character
  const withIconBullets = input.replace(/\{\{[^}]+\}\}/g, (candidate) =>
    isValidIconMarkup(candidate) ? '•' : candidate,
  );

  // Blog posts are counted on their rendered form
  const markup = isBlogPost ? parseMarkdown(withIconBullets) : withIconBullets;

  const flattened = markup
    // line breaks -> newline
    .replace(/<br\s*\/?>\s*\n*/gi, '\n')
    // links -> bullet (for the URL) + visible text
    .replace(
      /<a\s+href="[^"]*">([^<]*)<\/a>/gi,
      (_anchor, linkText) => '•' + linkText,
    )
    // images -> alt text, or a bullet when the alt text is empty
    .replace(
      /<img\s+[^>]*alt="([^"]*)"[^>]*>/gi,
      (_tag, altText) => altText || '•',
    );

  // Drop whatever HTML is left
  const textOnly = sanitizeHtml(flattened, {
    allowedTags: [], // Strip all tags
    allowedAttributes: {}, // Strip all attributes
  });

  // CRLF counts once; surrounding whitespace does not count
  return textOnly.replace(/\r\n/g, '\n').trim();
}
/**
 * Custom character counter.
 *
 * The input is first normalized by prepareContentForCharacterCount (valid icon
 * markup, links and CR/LF pairs are each reduced to a single character there),
 * and the result is then counted in Unicode code points rather than UTF-16 code
 * units, so a character outside the BMP counts once.
 * NOTE: emoji built from several code points (ZWJ sequences, flags, skin-tone
 * modifiers) count once per code point.
 * @param input The text to count
 * @param isBlogPost Forwarded to prepareContentForCharacterCount
 * @returns The number of code points in the normalized text
 */
export function getCharacterCount(input: string, isBlogPost: boolean): number {
  const countable = prepareContentForCharacterCount(input, isBlogPost);
  // Spreading a string iterates by code point, not by UTF-16 code unit.
  return [...countable].length;
}
/**
 * Collapses every run of whitespace into a single space and removes leading and
 * trailing whitespace.
 * @param input Text to normalize
 * @returns The text with its non-whitespace tokens joined by single spaces
 */
export function sanitizeWhitespace(input: string): string {
  // Splitting on whitespace runs leaves empty tokens at the edges; drop them
  // so the joined result carries no leading or trailing space.
  const tokens = input.split(/\s+/).filter((token) => token.length > 0);
  return tokens.join(' ');
}
/**
 * Prepares text for submission to the AI: whitespace is normalized with
 * sanitizeWhitespace first, then the icon markup is removed with stripIconMarkup.
 * @param input Text to clean
 * @returns The whitespace-normalized text with icon markup stripped
 */
export function sanitizeForAi(input: string): string {
  return stripIconMarkup(sanitizeWhitespace(input));
}
/**
 * Gets the current offset of a timezone from UTC, in minutes.
 *
 * The sign follows `Date.prototype.getTimezoneOffset`: zones behind UTC give a
 * positive value (e.g. 300 for UTC-5) and zones ahead of UTC a negative one
 * (e.g. -330 for UTC+5:30). The offset is evaluated at the moment of the call,
 * so it reflects whether daylight saving time is currently in effect.
 *
 * The wall-clock fields are read with `Intl.DateTimeFormat#formatToParts`
 * instead of re-parsing a locale-formatted string with `new Date(...)`: that
 * parsing is implementation-defined and is interpreted in the host's local
 * zone, which can skew the result around the host's own DST transitions.
 * @param timezone IANA timezone name, e.g. `America/New_York`
 * @returns Minutes to add to the zone's local time to obtain UTC
 * @throws RangeError if the timezone is not recognized
 */
export function getTimezoneOffset(timezone: string): number {
  const now = new Date();
  const formatter = new Intl.DateTimeFormat('en-US', {
    timeZone: timezone,
    hourCycle: 'h23',
    year: 'numeric',
    month: 'numeric',
    day: 'numeric',
    hour: 'numeric',
    minute: 'numeric',
    second: 'numeric',
  });
  const parts = formatter.formatToParts(now);
  const field = (type: string): number =>
    Number(parts.find((part) => part.type === type)?.value);

  // Re-read the zone's wall-clock time as if it were UTC; the gap to the real
  // instant is the zone's offset. `% 24` guards against engines that report
  // midnight as hour 24.
  const wallClockAsUtc = Date.UTC(
    field('year'),
    field('month') - 1,
    field('day'),
    field('hour') % 24,
    field('minute'),
    field('second'),
  );
  // The formatted fields carry no milliseconds, so drop them from the instant too.
  const nowWholeSeconds = Math.floor(now.getTime() / 1000) * 1000;
  return (nowWholeSeconds - wallClockAsUtc) / 60000;
}
/**
 * Reports whether a timezone name is usable, by attempting to compute its
 * offset with getTimezoneOffset.
 * @param timezone Timezone name to check
 * @returns true when getTimezoneOffset completes for the name, false when it throws
 */
export function isValidTimezone(timezone: string): boolean {
  let accepted = true;
  try {
    // An invalid timezone makes getTimezoneOffset throw
    getTimezoneOffset(timezone);
  } catch {
    accepted = false;
  }
  return accepted;
}