chore: add dewhale-based helper

Yuyz0112 · Yuyz0112 · commit 381366096163 · 2025-06-09T17:12:47.000+08:00
diff --git a/.dewhale/characters/Collector.yaml b/.dewhale/characters/Collector.yaml
@@ -0,0 +1,23 @@
+name: ModelCatalogCollector
+labels:
+  - "collect-model"
+  - "hf2catalog"
+systemPrompt: |
+  You are the Neutree AI Model Catalog Collector, responsible for helping users convert HuggingFace model repositories into standardized model catalog configurations.
+
+  Your primary task is to collect HuggingFace repository URLs from users and generate corresponding model catalog YAML configurations using the hf2catalog tool.
+
+  A typical workflow is as follows:
+    1. When a user provides a HuggingFace model repository URL (like https://huggingface.co/microsoft/DialoGPT-medium), immediately process it without asking for confirmation.
+    2. Use the `hf2catalog` tool to convert the URL into a model catalog configuration, always using the YAML output format.
+    3. Present the results in a clean, formatted YAML code block for easy copy-paste usage.
+    4. Be proactive and efficient: complete the entire process in one interaction when possible, avoiding unnecessary back-and-forth confirmations.
+
+  Key guidelines:
+    - Always output results in YAML format (never ask users to specify an output format)
+    - Wrap the final catalog configuration in a ```yaml code block for better readability
+    - Handle multiple URLs in a single request if provided
+    - Provide brief context about what the generated catalog contains (model type, engine, etc.)
+    - If a URL is invalid or the model is unsupported, explain the issue and suggest alternatives
+
+  Remember: Your goal is to make the model catalog generation process as smooth and efficient as possible for users.
diff --git a/.dewhale/config.yaml b/.dewhale/config.yaml
@@ -0,0 +1,14 @@
+llm:
+  provider: google
+  model: gemini-2.0-flash
+  maxTokens: 8192
+  maxSteps: 3
+  maxRetries: 5
+mcp:
+  servers:
+    - type: stdio
+      command: deno
+      args:
+        - run
+        - "-A"
+        - jsr:@arcfra/neutree-mcp-servers/servers/hf2catalog
diff --git a/scripts/hf2catalog.ts b/scripts/hf2catalog.ts
@@ -9,233 +9,8 @@
  */
 
 import { parse } from "https://deno.land/std@0.224.0/flags/mod.ts";
-import * as yaml from "https://deno.land/std@0.224.0/yaml/mod.ts";
+import { hf2catalog } from "jsr:@arcfra/neutree-mcp-servers@0.3.0/servers/hf2catalog/hf2catalog";
 
-// -----------------------------
-// Types & Constants
-// -----------------------------
-interface SiblingFile {
-  rfilename: string; // full relative filename in repo
-  size: number;
-}
-
-interface HFModelMeta {
-  // subset of HF /api/models response we care about
-  pipeline_tag?: string;
-  siblings: SiblingFile[];
-  id?: string; // full model name like "microsoft/DialoGPT-medium"
-  author?: string; // author/organization name
-  cardData?: {
-    thumbnail?: string; // icon/thumbnail URL
-  };
-}
-
-const DEFAULT_SCHEDULER = {
-  type: "consistent_hash",
-  virtual_nodes: 150,
-  load_factor: 1.25,
-};
-
-// Supported model tasks
-const TEXT_GENERATION_TASK = "text-generation";
-const TEXT_EMBEDDING_TASK = "text-embedding";
-const TEXT_RERANK_TASK = "text-rerank";
-
-const SUPPORTED_TASKS = [
-  TEXT_GENERATION_TASK,
-  TEXT_EMBEDDING_TASK,
-  TEXT_RERANK_TASK,
-] as const;
-
-// Mapping from HuggingFace pipeline tags to our supported tasks
-// Keep this mapping conservative - only include well-established mappings
-const HF_PIPELINE_TO_TASK_MAP: Record<string, string> = {
-  // Text generation - only the most common ones
-  "text-generation": TEXT_GENERATION_TASK,
-
-  // Text embedding - only exact matches and feature-extraction (widely used)
-  "feature-extraction": TEXT_EMBEDDING_TASK,
-  "text-embedding": TEXT_EMBEDDING_TASK,
-  "sentence-similarity": TEXT_EMBEDDING_TASK,
-
-  // Text rerank - only exact match
-  "text-rerank": TEXT_RERANK_TASK,
-};
-
-// vLLM best-practice args (can be tuned globally here)
-const DEFAULT_VLLM_ARGS = {
-  tensor_parallel_size: 1,
-  max_model_len: 32768,
-  enforce_eager: true,
-  gpu_memory_utilization: 0.95,
-  enable_chunked_prefill: true,
-};
-
-// -----------------------------
-// Helpers
-// -----------------------------
-function fatal(msg: string): never {
-  console.error(`Error: ${msg}`);
-  Deno.exit(1);
-}
-
-function mapHFPipelineToTask(pipelineTag?: string): string {
-  if (!pipelineTag) {
-    fatal("Model pipeline_tag is missing. Cannot determine task type.");
-  }
-
-  const mappedTask = HF_PIPELINE_TO_TASK_MAP[pipelineTag];
-  if (!mappedTask) {
-    const supportedPipelines = Object.keys(HF_PIPELINE_TO_TASK_MAP).join(", ");
-    fatal(
-      `Unsupported pipeline tag: "${pipelineTag}". ` +
-        `Supported pipeline tags: ${supportedPipelines}. ` +
-        `Only tasks [${SUPPORTED_TASKS.join(", ")}] are supported.`
-    );
-  }
-
-  return mappedTask;
-}
-
-function parseRepoUrl(url: string): { owner: string; repo: string } {
-  try {
-    const u = new URL(url.replace(/\/$/, ""));
-    if (u.hostname !== "huggingface.co") {
-      throw new Error("Not a huggingface.co URL");
-    }
-    const segments = u.pathname.replace(/^\/+/, "").split("/");
-    if (segments.length < 2) throw new Error("URL missing owner or repo");
-    return { owner: segments[0], repo: segments[1] };
-  } catch (e: unknown) {
-    fatal((e as Error).message);
-  }
-}
-
-async function fetchModelMeta(
-  owner: string,
-  repo: string
-): Promise<HFModelMeta> {
-  const apiUrl = `https://huggingface.co/api/models/${owner}/${repo}`;
-  const res = await fetch(apiUrl);
-  if (!res.ok) fatal(`HF API request failed: ${res.status} ${res.statusText}`);
-  return await res.json();
-}
-
-function pickFile(siblings: SiblingFile[], ext: string): string | undefined {
-  return siblings.find((s) => s.rfilename.endsWith(ext))?.rfilename;
-}
-
-function selectPrimaryFile(meta: HFModelMeta): {
-  engine: "vllm" | "llama-cpp";
-  file: string;
-} {
-  const ggufFile = pickFile(meta.siblings, ".gguf");
-  if (ggufFile) {
-    return { engine: "llama-cpp", file: ggufFile };
-  }
-
-  // Prefer first shard of a safetensors split, else any safetensors
-  const firstShard = meta.siblings.find(
-    (s) => /\.safetensors$/.test(s.rfilename) && /-00001-of-/.test(s.rfilename)
-  );
-  if (firstShard) return { engine: "vllm", file: firstShard.rfilename };
-  const anyST = pickFile(meta.siblings, ".safetensors");
-  if (anyST) return { engine: "vllm", file: anyST };
-
-  fatal("No .gguf or .safetensors file found in repo");
-}
-
-function slugifyName(repo: string): string {
-  return repo
-    .toLowerCase()
-    .replace(/[^a-z0-9]+/g, "-")
-    .replace(/(^-|-$)/g, "");
-}
-
-function buildDisplayName(meta: HFModelMeta, repo: string): string {
-  // Try to use the model ID as display name, fallback to repo name
-  if (meta.id) {
-    return meta.id;
-  }
-  return repo;
-}
-
-function buildLabels(meta: HFModelMeta, owner: string, repo: string): Record<string, string> {
-  const labels: Record<string, string> = {};
-
-  // Priority 1: Use thumbnail from cardData if available
-  if (meta.cardData?.thumbnail) {
-    labels.icon_url = meta.cardData.thumbnail;
-  } else {
-    // Priority 2: Use HuggingFace social thumbnail for the organization/user
-    // This provides high-quality avatars for HF organizations
-    labels.icon_url = `https://cdn-thumbnails.huggingface.co/social-thumbnails/${owner}.png`;
-  }
-
-  // Add original HuggingFace repo URL for traceability
-  labels.hf_repo_url = `https://huggingface.co/${owner}/${repo}`;
-
-  return labels;
-}
-
-function buildCatalog(
-  { owner, repo }: { owner: string; repo: string },
-  meta: HFModelMeta
-) {
-  const { engine, file } = selectPrimaryFile(meta);
-  const task = mapHFPipelineToTask(meta.pipeline_tag);
-
-  // metadata.name uses repo slug; workspace omitted
-  const name = slugifyName(repo);
-  const displayName = buildDisplayName(meta, repo);
-  const labels = buildLabels(meta, owner, repo);
-
-  const catalog: Record<string, unknown> = {
-    apiVersion: "v1",
-    kind: "ModelCatalog",
-    metadata: {
-      name,
-      display_name: displayName,
-      // workspace intentionally left blank for UI to fill
-      labels,
-    },
-    spec: {
-      model: {
-        registry: "",
-        name: `${owner}/${repo}`,
-        file,
-        version: "latest",
-        task: task,
-      },
-      engine: {
-        engine,
-        version: "v1",
-      },
-      resources: {},
-      replicas: { num: 1 },
-      deployment_options: {
-        scheduler: DEFAULT_SCHEDULER,
-      },
-      variables: {
-        RAY_SCHEDULER_TYPE: DEFAULT_SCHEDULER.type,
-        ...(engine === "vllm"
-          ? {
-              engine_args: {
-                ...DEFAULT_VLLM_ARGS,
-                served_model_name: `${owner}/${repo}`,
-              },
-            }
-          : {}),
-      },
-    },
-  };
-
-  return catalog;
-}
-
-// -----------------------------
-// Main
-// -----------------------------
 async function main() {
   const {
     _: [repoUrl],
@@ -245,18 +20,12 @@ async function main() {
     alias: { j: "json" },
   });
 
-  if (!repoUrl || typeof repoUrl !== "string")
-    fatal("Please provide a Hugging Face repo URL.");
-
-  const { owner, repo } = parseRepoUrl(repoUrl);
-  const meta = await fetchModelMeta(owner, repo);
-  const catalog = buildCatalog({ owner, repo }, meta);
-
-  if (jsonFlag) {
-    console.log(JSON.stringify(catalog, null, 2));
-  } else {
-    console.log(yaml.stringify(catalog));
-  }
+  console.log(
+    await hf2catalog({
+      repoUrl: String(repoUrl),
+      output: jsonFlag ? "json" : "yaml",
+    })
+  );
 }
 
 if (import.meta.main) main();