Skip to content

Commit

Permalink
add chakra
Browse files Browse the repository at this point in the history
  • Loading branch information
bat-kryptonyte committed Jul 21, 2023
1 parent 69cb69d commit 474915e
Show file tree
Hide file tree
Showing 7 changed files with 1,523 additions and 18 deletions.
5 changes: 5 additions & 0 deletions package.json
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,9 @@
"lint": "next lint"
},
"dependencies": {
"@chakra-ui/react": "^2.8.0",
"@emotion/react": "^11.11.1",
"@emotion/styled": "^11.11.0",
"@types/node": "20.4.1",
"@types/react": "18.2.14",
"@types/react-dom": "18.2.6",
Expand All @@ -18,6 +21,7 @@
"eslint": "8.44.0",
"eslint-config-next": "13.4.9",
"extract-mongo-schema": "^0.2.11",
"framer-motion": "^10.13.0",
"husky": "^8.0.3",
"lint-staged": "^13.2.3",
"mongoose": "^7.3.3",
Expand All @@ -26,6 +30,7 @@
"prettier": "^3.0.0",
"react": "18.2.0",
"react-dom": "18.2.0",
"react-icons": "^4.10.1",
"tailwindcss": "3.3.2",
"typescript": "5.1.6"
},
Expand Down
7 changes: 6 additions & 1 deletion src/pages/_app.tsx
Original file line number Diff line number Diff line change
@@ -1,6 +1,11 @@
import "@/styles/globals.css";
import type { AppProps } from "next/app";
import { ChakraProvider } from "@chakra-ui/react";

/**
 * Custom Next.js `App` component.
 *
 * Wraps every page in `ChakraProvider` so Chakra UI components rendered by
 * the page have access to the theme and style context.
 *
 * The previous body returned `<Component {...pageProps} />` before reaching
 * the provider-wrapped return, which left the `ChakraProvider` branch
 * unreachable; only the wrapped return is kept.
 *
 * @param Component - The active page component supplied by Next.js.
 * @param pageProps - The props Next.js resolved for that page.
 */
export default function App({ Component, pageProps }: AppProps) {
  return (
    <ChakraProvider>
      <Component {...pageProps} />
    </ChakraProvider>
  );
}
8 changes: 2 additions & 6 deletions src/pages/index.tsx
Original file line number Diff line number Diff line change
@@ -1,7 +1,3 @@
const Index = () => {
return <></>;
};
import Arb from "../screens/ARB";

Index.title = "ARB Problems Interface";

export default Index;
export default Arb;
195 changes: 195 additions & 0 deletions src/screens/ARB/Arb.tsx
Original file line number Diff line number Diff line change
@@ -0,0 +1,195 @@
import React from "react";
import {
Box,
Flex,
Link,
Heading,
Text,
IconButton,
Button,
Container,
Icon,
} from "@chakra-ui/react";
import { FaHome, FaFilePdf, FaGithub, FaImages } from "react-icons/fa";
import { AiFillFile } from "react-icons/ai";

/** One entry in the author line of the landing page. */
interface ArbAuthor {
  /** Display name, also used as the React list key. */
  name: string;
  /** Personal page the name links to. */
  href: string;
  /** Affiliation indices rendered as a superscript after the name. */
  affiliations: string;
}

/** Authors in the order they are displayed. */
const ARB_AUTHORS: readonly ArbAuthor[] = [
  {
    name: "Tomohiro Sawada",
    href: "https://tomohiro-sawada.github.io/",
    affiliations: "1,2",
  },
  {
    name: "Daniel Paleka",
    href: "https://danielpaleka.com/",
    affiliations: "1,3",
  },
  {
    name: "Alexander Havrilla",
    href: "https://dahoas.github.io/",
    affiliations: "1,2",
  },
  { name: "Pranav Tadepalli", href: "https://pranav.cc/", affiliations: "1,2" },
  // NOTE(review): "#" is a placeholder target — replace with a real URL or
  // render this author as plain text once that is decided.
  { name: "Paula Vidas", href: "#", affiliations: "1" },
  {
    name: "Alexander Kranias",
    href: "https://alexkranias.com/index.html",
    affiliations: "1,2",
  },
  { name: "John J Nay", href: "http://johnjnay.com/", affiliations: "1" },
  {
    name: "Kshitij Gupta",
    href: "https://kshitijkg.github.io/",
    affiliations: "1,4",
  },
  {
    name: "Aran Komatsuzaki",
    href: "https://twitter.com/arankomatsuzaki",
    affiliations: "1,2",
  },
];

/**
 * Landing page for the ARB (Advanced Reasoning Benchmark) paper.
 *
 * Renders, top to bottom: a navigation bar with a home link, a hero section
 * (title, author line, affiliations, resource buttons), the abstract, and an
 * empty footer bar. Takes no props.
 */
const Arb: React.FC = () => {
  return (
    <Box>
      <Flex
        as="nav"
        align="center"
        justify="center"
        wrap="wrap"
        padding={6}
        bg="teal.500"
      >
        <Box
          flexBasis={{ base: "100%", md: "auto" }}
          flexGrow={1}
          textAlign={{ base: "center", md: "left" }}
        >
          {/* Icon-only link: aria-label gives it an accessible name. */}
          <Link href="https://duckai.org" color="white" aria-label="DuckAI home">
            <Icon as={FaHome} w={6} h={6} />
          </Link>
        </Box>
      </Flex>

      <Box as="section" bg="gray.100" py={10}>
        <Container maxW="container.md">
          <Flex direction="column" align="center">
            <Heading as="h1" size="2xl">
              ARB: Advanced Reasoning Benchmark for Large Language Models
            </Heading>

            <Text fontSize="lg" mt={4}>
              {ARB_AUTHORS.map((author, index) => (
                <React.Fragment key={author.name}>
                  {/* Every link but the first is offset from the preceding comma. */}
                  <Link
                    href={author.href}
                    color="teal.500"
                    ml={index === 0 ? undefined : 2}
                  >
                    {author.name}
                  </Link>
                  <sup>{author.affiliations}</sup>
                  {index < ARB_AUTHORS.length - 1 ? "," : null}
                </React.Fragment>
              ))}
            </Text>

            <Text fontSize="lg" mt={2}>
              <Link href="https://duckai.org" color="teal.500">
                DuckAI
              </Link>
              , Georgia Institute of Technology, ETH Zürich, Mila - Quebec AI
              Institute
            </Text>

            {/*
              NOTE(review): these buttons have no href/onClick yet, so they
              render but do nothing when clicked. Wire them up once the
              paper/arXiv/code/dataset URLs are known.
            */}
            <Flex mt={4}>
              <Button
                leftIcon={<FaFilePdf />}
                colorScheme="teal"
                variant="solid"
              >
                Paper
              </Button>
              <Button
                leftIcon={<AiFillFile />}
                colorScheme="teal"
                variant="solid"
                ml={4}
              >
                arXiv
              </Button>
              <Button
                leftIcon={<FaGithub />}
                colorScheme="teal"
                variant="solid"
                ml={4}
              >
                Code
              </Button>
              <Button
                leftIcon={<FaImages />}
                colorScheme="teal"
                variant="solid"
                ml={4}
              >
                Dataset
              </Button>
            </Flex>
          </Flex>
        </Container>
      </Box>

      <Box as="section" py={10}>
        <Container maxW="container.md">
          <Flex direction="column" align="center">
            <Heading as="h2" size="lg">
              Abstract
            </Heading>

            {/*
              Width is "80%" rather than the Tailwind-style "4/5": that
              fraction is not a token in Chakra UI v2's default size scale
              and would be emitted as the invalid CSS value `width: 4/5`.
            */}
            <Text textAlign="justify" mt={4} w="80%">
              Large Language Models (LLMs) have demonstrated remarkable
              performance on various quantitative reasoning and knowledge
              benchmarks, such as MMLU and MATH. However, many of these
              benchmarks are losing utility as LLMs get increasingly high
              scores, despite not yet achieving expert level performance in
              these domains. We introduce ARB, a novel benchmark composed of
              advanced reasoning problems designed to evaluate LLMs on text
              comprehension and expert domain reasoning. ARB presents a more
              challenging test than prior benchmarks, featuring questions that
              test deeper knowledge of mathematics, physics, biology, chemistry,
              and law.
            </Text>

            <Text textAlign="justify" mt={4} w="80%">
              As a subset of ARB, we introduce a challenging set of math and
              physics problems which require advanced symbolic reasoning and
              domain knowledge. In order to improve both automatic and assisted
              symbolic evaluation capabilities, we introduce a rubric-based
              self-evaluation approach, allowing GPT-4 to score its own
              intermediate reasoning steps.
            </Text>

            <Text textAlign="justify" mt={4} w="80%">
              We evaluate recent models such as GPT-4 and Claude on ARB and
              demonstrate that even with Chain-of-Thought prompting methods,
              current models score well below 50% on more demanding expert
              tasks. Further, we conduct a human evaluation of the symbolic
              subset of ARB, finding close agreement between annotators and
              GPT-4 self-evaluation scores.
            </Text>
          </Flex>
        </Container>
      </Box>

      {/* ... additional sections ... */}
      {/* Footer */}
      <Flex
        as="footer"
        align="center"
        justify="center"
        wrap="wrap"
        padding={6}
        bg="teal.500"
      >
        {/* Footer content here... */}
      </Flex>
    </Box>
  );
};

export default Arb;
3 changes: 3 additions & 0 deletions src/screens/ARB/index.tsx
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
import Arb from "./Arb";

export default Arb;
9 changes: 6 additions & 3 deletions src/screens/Home/Home.tsx
Original file line number Diff line number Diff line change
Expand Up @@ -63,17 +63,16 @@ export default function Home() {
setProblem(data["randomProblem"]);
});
};

console.log("Problem Statement:", problemStatement);
useEffect(() => {
if (problem) {
if (isNumericalProblem(problem)) {
setProblemStatement(problem.Problem_Statement);
setFinalAnswer(problem["Final Answer"]);
} else {
setProblemStatement(problem["Problem Statement"]);
setAnswerCandidates(problem["Answer Candidates"]);
setFinalAnswer(problem["Final Answer"]);
}
setFinalAnswer(problem["Final Answer"]);
}
}, [problem]);

Expand Down Expand Up @@ -105,6 +104,10 @@ export default function Home() {
return <div>Loading...</div>;
}

console.log("Problem Statement:", problemStatement);

console.log("Final Answer:", finalAnswer);

return (
<div className={styles.container}>
<h1>Select Problem Type</h1>
Expand Down
Loading

0 comments on commit 474915e

Please sign in to comment.