Skip to content

Commit

Permalink
update ui
Browse files Browse the repository at this point in the history
  • Loading branch information
xzyaoi committed Jan 13, 2025
1 parent c9825e2 commit 1fc5191
Show file tree
Hide file tree
Showing 11 changed files with 29 additions and 37 deletions.
2 changes: 1 addition & 1 deletion frontend/src/components/ArrowCard.astro
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
import type { CollectionEntry } from "astro:content";
type Props = {
entry: CollectionEntry<"docs"> | CollectionEntry<"articles">;
entry: CollectionEntry<"guides"> | CollectionEntry<"articles">;
}
const { entry } = Astro.props;
Expand Down
4 changes: 2 additions & 2 deletions frontend/src/components/Header.astro
Original file line number Diff line number Diff line change
Expand Up @@ -13,13 +13,13 @@ import { SITE } from "@consts";
</div>
</Link>
<nav class="flex gap-1">
<Link href="/docs">
<Link href="/guides">
Docs
</Link>
<span>
{`/`}
</span>
<Link href="/research">
<Link href="/articles">
Research
</Link>
</nav>
Expand Down
23 changes: 4 additions & 19 deletions frontend/src/consts.ts
Original file line number Diff line number Diff line change
Expand Up @@ -10,12 +10,12 @@ export const SITE: Site = {

export const HOME: Metadata = {
TITLE: "Home",
DESCRIPTION: "Astro Nano is a minimal and lightweight blog and portfolio.",
DESCRIPTION: "Serving Platform @ SwissAI Initiative",
};

export const ARTICLES: Metadata = {
TITLE: "Articles",
DESCRIPTION: "A collection of articles on topics I am passionate about.",
DESCRIPTION: "A collection of research articles about efficient ML.",
};

export const WORK: Metadata = {
Expand All @@ -25,20 +25,5 @@ export const WORK: Metadata = {

export const DOCS: Metadata = {
TITLE: "Docs",
DESCRIPTION: "A collection of my projects, with links to repositories and demos.",
};

export const SOCIALS: Socials = [
{
NAME: "twitter-x",
HREF: "https://twitter.com/markhorn_dev",
},
{
NAME: "github",
HREF: "https://github.com/markhorn-dev"
},
{
NAME: "linkedin",
HREF: "https://www.linkedin.com/in/markhorn-dev",
}
];
DESCRIPTION: "A collection of guides.",
};
10 changes: 7 additions & 3 deletions frontend/src/content/articles/01-getting-started/index.md
Original file line number Diff line number Diff line change
@@ -1,7 +1,11 @@
---
title: "Getting started"
description: "Hit the ground running."
title: "DeltaZip: Multi Full Fine-tuned LLM Serving"
description: "Fine-tuning large language models (LLMs) greatly improves model quality for downstream tasks. However, serving many fine-tuned LLMs concurrently is challenging due to the sporadic, bursty, and varying request patterns of different LLMs. To bridge this gap, we present DeltaZip, an LLM serving system that efficiently serves multiple full-parameter fine-tuned models concurrently by aggressively compressing model deltas by up to 10x while maintaining high model quality. The key insight behind this design is that fine-tuning results in small-magnitude changes to the pre-trained model. By co-designing the serving system with the compression algorithm, DeltaZip achieves 2x to 12x improvement in throughput compared to the state-of-the-art systems."
date: "Mar 22 2024"
demoURL: "https://arxiv.org/abs/2312.05215"
repoURL: "https://github.com/eth-easl/deltazip"
---

This is a test article.
[Model Zoo](https://huggingface.co/deltazip).

Fine-tuning large language models (LLMs) greatly improves model quality for downstream tasks. However, serving many fine-tuned LLMs concurrently is challenging due to the sporadic, bursty, and varying request patterns of different LLMs. To bridge this gap, we present DeltaZip, an LLM serving system that efficiently serves multiple full-parameter fine-tuned models concurrently by aggressively compressing model deltas by up to 10x while maintaining high model quality. The key insight behind this design is that fine-tuning results in small-magnitude changes to the pre-trained model. By co-designing the serving system with the compression algorithm, DeltaZip achieves 2x to 12x improvement in throughput compared to the state-of-the-art systems.
4 changes: 2 additions & 2 deletions frontend/src/content/config.ts
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
import { defineCollection, z } from "astro:content";

const docs = defineCollection({
const guides = defineCollection({
type: "content",
schema: z.object({
title: z.string(),
Expand All @@ -22,4 +22,4 @@ const articles = defineCollection({
}),
});

export const collections = { docs, articles };
export const collections = { guides, articles };
4 changes: 2 additions & 2 deletions frontend/src/pages/articles/[...slug].astro
Original file line number Diff line number Diff line change
Expand Up @@ -46,15 +46,15 @@ const { Content } = await project.render();
<nav class="animate flex gap-1">
{project.data.demoURL && (
<Link href={project.data.demoURL} external>
demo
Paper
</Link>
)}
{project.data.demoURL && project.data.repoURL && (
<span>/</span>
)}
{project.data.repoURL && (
<Link href={project.data.repoURL} external>
repo
Repo
</Link>
)}
</nav>
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -7,15 +7,15 @@ import { readingTime } from "@lib/utils";
import BackToPrev from "@components/BackToPrev.astro";
export async function getStaticPaths() {
const posts = (await getCollection("docs"))
const posts = (await getCollection("guides"))
.filter(post => !post.data.draft)
.sort((a, b) => b.data.date.valueOf() - a.data.date.valueOf());
return posts.map((post) => ({
params: { slug: post.slug },
props: post,
}));
}
type Props = CollectionEntry<"docs">;
type Props = CollectionEntry<"guides">;
const post = Astro.props;
const { Content } = await post.render();
Expand All @@ -24,7 +24,7 @@ const { Content } = await post.render();
<PageLayout title={post.data.title} description={post.data.description}>
<Container>
<div class="animate">
<BackToPrev href="/docs">
<BackToPrev href="/guides">
Back to docs
</BackToPrev>
</div>
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -5,12 +5,12 @@ import Container from "@components/Container.astro";
import ArrowCard from "@components/ArrowCard.astro";
import { DOCS } from "@consts";
const data = (await getCollection("docs"))
const data = (await getCollection("guides"))
.filter(post => !post.data.draft)
.sort((a, b) => b.data.date.valueOf() - a.data.date.valueOf());
type Acc = {
[year: string]: CollectionEntry<"docs">[];
[year: string]: CollectionEntry<"guides">[];
}
const posts = data.reduce((acc: Acc, post) => {
Expand Down
7 changes: 5 additions & 2 deletions frontend/src/pages/index.astro
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@ import Link from "@components/Link.astro";
import { dateRange } from "@lib/utils";
import { SITE, HOME } from "@consts";
const docs = (await getCollection("docs"))
const docs = (await getCollection("guides"))
.filter(post => !post.data.draft)
.sort((a, b) => b.data.date.valueOf() - a.data.date.valueOf())
.slice(0,SITE.NUM_POSTS_ON_HOMEPAGE);
Expand Down Expand Up @@ -48,13 +48,16 @@ const articles = (await getCollection("articles"))
<button class="bg-blue-500 hover:bg-blue-700 text-white font-bold py-2 px-4 rounded">
<a href="/login">Login</a>
</button>
<button class="bg-gray-500 hover:bg-blue-700 text-white font-bold py-2 px-4 rounded">
<a href="/chat">Chat</a>
</button>
</section>
<section class="animate space-y-6">
<div class="flex flex-wrap gap-y-2 items-center justify-between">
<h5 class="font-semibold text-black dark:text-white">
Documentation
</h5>
<Link href="/docs">
<Link href="/guides">
See all docs
</Link>
</div>
Expand Down
2 changes: 1 addition & 1 deletion frontend/src/pages/rss.xml.ts
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@ type Context = {
}

export async function GET(context: Context) {
const docs = (await getCollection("docs"))
const docs = (await getCollection("guides"))
.filter(post => !post.data.draft);

const articles = (await getCollection("articles"))
Expand Down

0 comments on commit 1fc5191

Please sign in to comment.