Skip to content
This repository has been archived by the owner on Sep 19, 2024. It is now read-only.

feat: change to markdown and map html to markdown #688

Draft
wants to merge 7 commits into
base: development
Choose a base branch
from
Draft
Show file tree
Hide file tree
Changes from 4 commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 4 additions & 2 deletions package.json
Original file line number Diff line number Diff line change
Expand Up @@ -41,20 +41,22 @@
"ajv": "^8.11.2",
"ajv-formats": "^2.1.1",
"axios": "^1.3.2",
"decimal.js": "^10.4.3",
"copyfiles": "^2.4.1",
"decimal.js": "^10.4.3",
"ethers": "^5.7.2",
"exponential-backoff": "^3.1.1",
"husky": "^8.0.2",
"jimp": "^0.22.4",
"js-yaml": "^4.1.0",
"libsodium-wrappers": "^0.7.11",
"lint-staged": "^13.1.0",
"mdast-util-from-markdown": "^0.8.5",
"mdast-util-gfm": "^0.1.2",
"micromark-extension-gfm": "^0.3.3",
"ms": "^2.1.3",
"node-html-parser": "^6.1.5",
"node-html-to-image": "^3.3.0",
"nodemon": "^2.0.19",
"parse5": "^7.1.2",
"prettier": "^2.7.1",
"probot": "^12.2.4",
"telegraf": "^4.11.2",
Expand Down
1 change: 1 addition & 0 deletions src/decs.d.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
declare module "mdast-util-gfm";
60 changes: 48 additions & 12 deletions src/handlers/payout/post.ts
Original file line number Diff line number Diff line change
@@ -1,10 +1,11 @@
import { getWalletAddress } from "../../adapters/supabase";
import { getBotConfig, getBotContext, getLogger } from "../../bindings";
import { addCommentToIssue, generatePermit2Signature, getAllIssueComments, getIssueDescription, getTokenSymbol, parseComments } from "../../helpers";
import { Incentives, MarkdownItem, Payload, StateReason, UserType } from "../../types";
import { Incentives, MarkdownItem, MarkdownItems, Payload, StateReason, UserType } from "../../types";
import { commentParser } from "../comment";
import Decimal from "decimal.js";
import { bountyInfo } from "../wildcard";
import { HTMLItem } from "../../types/html";

const ItemsToExclude: string[] = [MarkdownItem.BlockQuote];
/**
Expand Down Expand Up @@ -62,7 +63,7 @@ export const incentivizeComments = async () => {
return;
}

const issueComments = await getAllIssueComments(issue.number, "full");
const issueComments = await getAllIssueComments(issue.number);
logger.info(`Getting the issue comments done. comments: ${JSON.stringify(issueComments)}`);
const issueCommentsByUser: Record<string, string[]> = {};
for (const issueComment of issueComments) {
Expand All @@ -73,14 +74,14 @@ export const incentivizeComments = async () => {
logger.info(`Skipping to parse the comment because it contains commands. comment: ${JSON.stringify(issueComment)}`);
continue;
}
if (!issueComment.body_html) {
logger.info(`Skipping to parse the comment because body_html is undefined. comment: ${JSON.stringify(issueComment)}`);
if (!issueComment.body) {
logger.info(`Skipping to parse the comment because body is undefined. comment: ${JSON.stringify(issueComment)}`);
continue;
}
if (!issueCommentsByUser[user.login]) {
issueCommentsByUser[user.login] = [];
}
issueCommentsByUser[user.login].push(issueComment.body_html);
issueCommentsByUser[user.login].push(issueComment.body);
}
const tokenSymbol = await getTokenSymbol(paymentToken, rpc);
logger.info(`Filtering by the user type done. commentsByUser: ${JSON.stringify(issueCommentsByUser)}`);
Expand Down Expand Up @@ -172,7 +173,7 @@ export const incentivizeCreatorComment = async () => {
return;
}

const description = await getIssueDescription(issue.number, "html");
const description = await getIssueDescription(issue.number);
if (!description) {
logger.info(`Skipping to generate a permit url because issue description is empty. description: ${description}`);
return;
Expand Down Expand Up @@ -243,28 +244,63 @@ const generatePermitForComments = async (
* @param incentives - The basic price table for reward calculation
* @returns - The reward value
*/
const calculateRewardValue = (comments: Record<string, string[]>, incentives: Incentives): Decimal => {
const calculateRewardValue = (comments: Record<MarkdownItem, string[]>, incentives: Incentives): Decimal => {
let sum = new Decimal(0);
for (const key of Object.keys(comments)) {
const value = comments[key];
for (const item of MarkdownItems) {
const value = comments[item];

// if it's a text node calculate word count and multiply with the reward value
if (key == "#text") {
if (item === MarkdownItem.Text) {
if (!incentives.comment.totals.word) {
continue;
}
const wordReward = new Decimal(incentives.comment.totals.word);
const reward = wordReward.mul(value.map((str) => str.trim().split(" ").length).reduce((totalWords, wordCount) => totalWords + wordCount, 0));
sum = sum.add(reward);
} else {
if (!incentives.comment.elements[key]) {
const htmlTag = MarkdownItemToHTMLTag[item];
if (!htmlTag || !incentives.comment.elements[htmlTag]) {
continue;
}
const rewardValue = new Decimal(incentives.comment.elements[key]);
const rewardValue = new Decimal(incentives.comment.elements[htmlTag]);
const reward = rewardValue.mul(value.length);
sum = sum.add(reward);
}
}

return sum;
};

const MarkdownItemToHTMLTag: Record<MarkdownItem, string> = {
[MarkdownItem.Text]: HTMLItem.P,
[MarkdownItem.Paragraph]: HTMLItem.P,
[MarkdownItem.Heading]: HTMLItem.H1,
[MarkdownItem.Heading1]: HTMLItem.H1,
[MarkdownItem.Heading2]: HTMLItem.H2,
[MarkdownItem.Heading3]: HTMLItem.H3,
[MarkdownItem.Heading4]: HTMLItem.H4,
[MarkdownItem.Heading5]: HTMLItem.H5,
[MarkdownItem.Heading6]: HTMLItem.H6,
[MarkdownItem.ListItem]: HTMLItem.LI,
[MarkdownItem.List]: HTMLItem.UL,
[MarkdownItem.Link]: HTMLItem.A,
[MarkdownItem.Image]: HTMLItem.IMG,
[MarkdownItem.BlockQuote]: HTMLItem.BLOCKQUOTE,
[MarkdownItem.Code]: HTMLItem.PRE,
Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I'm not sure it will be clear to partners that `<pre>` refers to a (fenced) code block and `<code>` refers to inline code.

[MarkdownItem.Emphasis]: HTMLItem.EM,
[MarkdownItem.Strong]: HTMLItem.STRONG,
[MarkdownItem.Delete]: HTMLItem.DEL,
[MarkdownItem.HTML]: HTMLItem.HTML,
[MarkdownItem.InlineCode]: HTMLItem.CODE,
[MarkdownItem.LinkReference]: HTMLItem.A,
[MarkdownItem.ImageReference]: HTMLItem.IMG,
[MarkdownItem.FootnoteReference]: HTMLItem.SUP,
[MarkdownItem.FootnoteDefinition]: HTMLItem.P,
Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I'm not sure how we can represent footnote references and definitions in HTML. @pavlovcik

Example of footnote¹

Footnotes

  1. Footnote 1

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Very cool. I didn't know about this but I guess we can just file an issue and kick the can down the road?

[MarkdownItem.Table]: HTMLItem.TABLE,
[MarkdownItem.TableCell]: HTMLItem.TD,
[MarkdownItem.TableRow]: HTMLItem.TR,
[MarkdownItem.ThematicBreak]: HTMLItem.HR,
[MarkdownItem.Break]: HTMLItem.BR,
[MarkdownItem.Root]: HTMLItem.HTML,
[MarkdownItem.Definition]: HTMLItem.DL,
};
85 changes: 66 additions & 19 deletions src/helpers/comment.ts
Original file line number Diff line number Diff line change
@@ -1,42 +1,89 @@
import * as parse5 from "parse5";
import { MarkdownItem } from "../types";
import fromMarkdown from "mdast-util-from-markdown";
import gfmFromMarkdown from "mdast-util-gfm";
import gfm from "micromark-extension-gfm";

type Node = {
nodeName: string;
tagName?: string;
value?: string;
childNodes?: Node[];
type: MarkdownItem;
value: string;
depth?: number;
children: Node[];
};

const traverse = (result: Record<string, string[]>, node: Node, itemsToExclude: string[]): Record<string, string[]> => {
if (itemsToExclude.includes(node.nodeName)) {
return result;
const traverse = (result: Record<MarkdownItem, string[]>, node: Node, itemsToExclude: string[]): Record<MarkdownItem, string[]> => {
if (!result[node.type]) {
result[node.type] = [];
}

if (!result[node.nodeName]) {
result[node.nodeName] = [];
if (node.type === MarkdownItem.Heading) {
node.type = `heading${node.depth}` as MarkdownItem;
}

result[node.nodeName].push(node.value?.trim() ?? "");
result[node.type].push(node.value?.trim() ?? "");

if (itemsToExclude.includes(node.type)) {
return result;
}

if (node.childNodes && node.childNodes.length > 0) {
node.childNodes.forEach((child) => traverse(result, child, itemsToExclude));
if (node.children && node.children.length > 0) {
node.children.forEach((child) => traverse(result, child, itemsToExclude));
}

return result;
};

export const parseComments = (comments: string[], itemsToExclude: string[]): Record<string, string[]> => {
const result: Record<string, string[]> = {};
export const parseComments = async (comments: string[], itemsToExclude: string[]): Promise<Record<MarkdownItem, string[]>> => {
const result: Record<MarkdownItem, string[]> = {
[MarkdownItem.Text]: [],
[MarkdownItem.Paragraph]: [],
[MarkdownItem.Heading]: [],
[MarkdownItem.Heading1]: [],
[MarkdownItem.Heading2]: [],
[MarkdownItem.Heading3]: [],
[MarkdownItem.Heading4]: [],
[MarkdownItem.Heading5]: [],
[MarkdownItem.Heading6]: [],
[MarkdownItem.ListItem]: [],
[MarkdownItem.List]: [],
[MarkdownItem.Link]: [],
[MarkdownItem.Image]: [],
[MarkdownItem.BlockQuote]: [],
[MarkdownItem.Code]: [],
[MarkdownItem.Emphasis]: [],
[MarkdownItem.Strong]: [],
[MarkdownItem.Delete]: [],
[MarkdownItem.HTML]: [],
[MarkdownItem.InlineCode]: [],
[MarkdownItem.LinkReference]: [],
[MarkdownItem.ImageReference]: [],
[MarkdownItem.FootnoteReference]: [],
[MarkdownItem.FootnoteDefinition]: [],
[MarkdownItem.Table]: [],
[MarkdownItem.TableCell]: [],
[MarkdownItem.TableRow]: [],
[MarkdownItem.ThematicBreak]: [],
[MarkdownItem.Break]: [],
[MarkdownItem.Root]: [],
[MarkdownItem.Definition]: [],
};

for (const comment of comments) {
const fragment = parse5.parseFragment(comment);
traverse(result, fragment as Node, itemsToExclude);
const tree = fromMarkdown(comment, {
extensions: [gfm()],
mdastExtensions: [gfmFromMarkdown.fromMarkdown],
});
console.log(`Comment Mdast Tree: ${JSON.stringify(tree, null, 2)}`);
traverse(result, tree as Node, itemsToExclude);
}

console.log(`Comment Parsed: ${JSON.stringify(result, null, 2)}`);

// remove empty values
if (result["#text"]) {
result["#text"] = result["#text"].filter((str) => str.length > 0);
if (result[MarkdownItem.Text]) {
result[MarkdownItem.Text] = result[MarkdownItem.Text].filter((str) => str.length > 0);
}

console.log(`Comment Parsed Cleaned: ${JSON.stringify(result, null, 2)}`);

return result;
};
27 changes: 27 additions & 0 deletions src/types/html.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
/**
 * HTML tag names, as lowercase strings.
 *
 * In src/handlers/payout/post.ts these members are the values of
 * `MarkdownItemToHTMLTag`; the resulting tag string is then used as the lookup
 * key into `incentives.comment.elements` when a comment's reward is computed.
 */
export enum HTMLItem {
// Mapped from MarkdownItem.Text, Paragraph and FootnoteDefinition.
P = "p",
// H1 is the target for both the generic MarkdownItem.Heading and Heading1.
H1 = "h1",
H2 = "h2",
H3 = "h3",
H4 = "h4",
H5 = "h5",
H6 = "h6",
// Only target for MarkdownItem.List; there is no separate `ol` member.
UL = "ul",
// Mapped from both Link and LinkReference.
A = "a",
// Mapped from both Image and ImageReference.
IMG = "img",
BLOCKQUOTE = "blockquote",
// Mapped from MarkdownItem.InlineCode (block-level code uses PRE below).
CODE = "code",
EM = "em",
STRONG = "strong",
DEL = "del",
// Mapped from both MarkdownItem.HTML and MarkdownItem.Root.
HTML = "html",
// Mapped from MarkdownItem.FootnoteReference.
SUP = "sup",
LI = "li",
TABLE = "table",
TR = "tr",
TD = "td",
HR = "hr",
BR = "br",
// Mapped from MarkdownItem.Definition.
// NOTE(review): a Markdown "definition" node is presumably a link/image
// reference definition rather than an HTML description list — confirm.
DL = "dl",
// Mapped from MarkdownItem.Code, i.e. block-level code.
PRE = "pre",
}
80 changes: 70 additions & 10 deletions src/types/markdown.ts
Original file line number Diff line number Diff line change
@@ -1,10 +1,70 @@
export const MarkdownItem = {
Paragraph: "paragraph",
List: "list",
Link: "link",
Text: "text",
Code: "code",
Image: "image",
BlockQuote: "blockquote",
} as const;
export type MarkdownItem = (typeof MarkdownItem)[keyof typeof MarkdownItem];
/**
 * Node types recognised when a comment is parsed as Markdown.
 *
 * All types supported by standard Markdown and GFM, plus six project-specific
 * heading levels. Each value is the string compared against (or written to) a
 * parsed node's `type` field in src/helpers/comment.ts, and the key under which
 * that node's text is collected in the parse result.
 */
export enum MarkdownItem {
// Standard Markdown
BlockQuote = "blockquote",
Break = "break",
Code = "code",
Definition = "definition",
Emphasis = "emphasis",
// Generic heading; `traverse` rewrites a heading node's type to
// `heading${depth}` before recording it, so it lands under Heading1..Heading6.
Heading = "heading",
HTML = "html",
Image = "image",
ImageReference = "imageReference",
InlineCode = "inlineCode",
Link = "link",
LinkReference = "linkReference",
List = "list",
ListItem = "listItem",
Paragraph = "paragraph",
Root = "root",
Strong = "strong",
// Text nodes are rewarded per word rather than per element in
// calculateRewardValue.
Text = "text",
ThematicBreak = "thematicBreak",
// GFM
Delete = "delete",
FootnoteDefinition = "footnoteDefinition",
FootnoteReference = "footnoteReference",
Table = "table",
TableCell = "tableCell",
TableRow = "tableRow",
// Our custom types to make it compatible with HTML
// (one per heading depth, so each can map to h1..h6).
Heading1 = "heading1",
Heading2 = "heading2",
Heading3 = "heading3",
Heading4 = "heading4",
Heading5 = "heading5",
Heading6 = "heading6",
}
/**
 * Readonly tuple listing every `MarkdownItem` member, in the same order as the
 * enum declaration. `calculateRewardValue` iterates this list to visit each
 * item type of a parsed comment.
 *
 * The list is maintained by hand: a member added to `MarkdownItem` must also be
 * added here, otherwise it is never visited by that loop.
 */
export const MarkdownItems = [
// Standard Markdown
MarkdownItem.BlockQuote,
MarkdownItem.Break,
MarkdownItem.Code,
MarkdownItem.Definition,
MarkdownItem.Emphasis,
MarkdownItem.Heading,
MarkdownItem.HTML,
MarkdownItem.Image,
MarkdownItem.ImageReference,
MarkdownItem.InlineCode,
MarkdownItem.Link,
MarkdownItem.LinkReference,
MarkdownItem.List,
MarkdownItem.ListItem,
MarkdownItem.Paragraph,
MarkdownItem.Root,
MarkdownItem.Strong,
MarkdownItem.Text,
MarkdownItem.ThematicBreak,
// GFM
MarkdownItem.Delete,
MarkdownItem.FootnoteDefinition,
MarkdownItem.FootnoteReference,
MarkdownItem.Table,
MarkdownItem.TableCell,
MarkdownItem.TableRow,
// Custom per-depth heading types
MarkdownItem.Heading1,
MarkdownItem.Heading2,
MarkdownItem.Heading3,
MarkdownItem.Heading4,
MarkdownItem.Heading5,
MarkdownItem.Heading6,
] as const;
Loading