Skip to content

Commit fe6eb8d

Browse files
committed
A few more tweaks
1 parent c2e5c8d commit fe6eb8d

File tree

4 files changed

+30
-21
lines changed

4 files changed

+30
-21
lines changed

evals/apps/web/src/app/home.tsx

Lines changed: 19 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -1,14 +1,14 @@
11
"use client"
22

3+
import { useMemo } from "react"
34
import { useRouter } from "next/navigation"
4-
import { Rocket } from "lucide-react"
5+
import Link from "next/link"
6+
import { ChevronRight, Rocket } from "lucide-react"
57

68
import type { Run, TaskMetrics } from "@evals/db"
79

8-
import { formatCurrency, formatDuration } from "@/lib"
10+
import { formatCurrency, formatDuration, formatTokens } from "@/lib"
911
import { Button, Table, TableBody, TableCell, TableHead, TableHeader, TableRow } from "@/components/ui"
10-
import { useMemo } from "react"
11-
import Link from "next/link"
1212

1313
export function Home({ runs }: { runs: (Run & { taskMetrics: TaskMetrics | null })[] }) {
1414
const router = useRouter()
@@ -20,32 +20,39 @@ export function Home({ runs }: { runs: (Run & { taskMetrics: TaskMetrics | null
2020
<Table className="border border-t-0">
2121
<TableHeader>
2222
<TableRow>
23-
<TableHead>ID</TableHead>
2423
<TableHead>Model</TableHead>
25-
<TableHead>Timestamp</TableHead>
2624
<TableHead>Passed</TableHead>
2725
<TableHead>Failed</TableHead>
2826
<TableHead>% Correct</TableHead>
27+
<TableHead className="text-center">Tokens In / Out</TableHead>
2928
<TableHead>Cost</TableHead>
3029
<TableHead>Duration</TableHead>
30+
<TableHead />
3131
</TableRow>
3232
</TableHeader>
3333
<TableBody>
3434
{visibleRuns.length ? (
3535
visibleRuns.map(({ taskMetrics, ...run }) => (
3636
<TableRow key={run.id}>
37-
<TableCell>
38-
<Button variant="link" asChild>
39-
<Link href={`/runs/${run.id}`}>{run.id}</Link>
40-
</Button>
41-
</TableCell>
4237
<TableCell>{run.model}</TableCell>
43-
<TableCell>{new Date(run.createdAt).toLocaleString()}</TableCell>
4438
<TableCell>{run.passed}</TableCell>
4539
<TableCell>{run.failed}</TableCell>
4640
<TableCell>{((run.passed / (run.passed + run.failed)) * 100).toFixed(1)}%</TableCell>
41+
<TableCell>
42+
<div className="flex items-center justify-evenly">
43+
<div>{formatTokens(taskMetrics!.tokensIn)}</div>/
44+
<div>{formatTokens(taskMetrics!.tokensOut)}</div>
45+
</div>
46+
</TableCell>
4747
<TableCell>{formatCurrency(taskMetrics!.cost)}</TableCell>
4848
<TableCell>{formatDuration(taskMetrics!.duration)}</TableCell>
49+
<TableCell>
50+
<Button variant="ghost" size="icon" asChild>
51+
<Link href={`/runs/${run.id}`}>
52+
<ChevronRight />
53+
</Link>
54+
</Button>
55+
</TableCell>
4956
</TableRow>
5057
))
5158
) : (

evals/apps/web/src/app/runs/[id]/run.tsx

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,7 @@ export function Run({ run }: { run: db.Run }) {
3737
<div>{run.model}</div>
3838
{run.description && <div className="text-sm text-muted-foreground">{run.description}</div>}
3939
</div>
40-
<ConnectionStatus status={status} pid={run.pid} />
40+
{!run.taskMetricsId && <ConnectionStatus status={status} pid={run.pid} />}
4141
</div>
4242
{!tasks ? (
4343
<LoaderCircle className="size-4 animate-spin" />

evals/apps/web/src/lib/format-tokens.ts

Lines changed: 9 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,5 +3,13 @@ export const formatTokens = (tokens: number) => {
33
return tokens.toString()
44
}
55

6-
return `${(tokens / 1000).toFixed(1)}k`
6+
if (tokens < 1000000) {
7+
return `${(tokens / 1000).toFixed(1)}k`
8+
}
9+
10+
if (tokens < 1000000000) {
11+
return `${(tokens / 1000000).toFixed(1)}M`
12+
}
13+
14+
return `${(tokens / 1000000000).toFixed(1)}B`
715
}

evals/packages/types/src/roo-code.ts

Lines changed: 1 addition & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -270,12 +270,7 @@ export type CustomSupportPrompts = z.infer<typeof customSupportPromptsSchema>
270270
* ExperimentId
271271
*/
272272

273-
export const experimentIds = [
274-
"search_and_replace",
275-
"insert_content",
276-
"powerSteering",
277-
"multi_search_and_replace",
278-
] as const
273+
export const experimentIds = ["search_and_replace", "insert_content", "powerSteering"] as const
279274

280275
export const experimentIdsSchema = z.enum(experimentIds)
281276

@@ -289,7 +284,6 @@ const experimentsSchema = z.object({
289284
search_and_replace: z.boolean(),
290285
insert_content: z.boolean(),
291286
powerSteering: z.boolean(),
292-
multi_search_and_replace: z.boolean(),
293287
})
294288

295289
export type Experiments = z.infer<typeof experimentsSchema>

0 commit comments

Comments
 (0)