jasonhp
diff --git a/‎.github/workflows/ollama-template-update.yml‎
Lines changed: 108 additions & 0 deletions b/‎.github/workflows/ollama-template-update.yml‎
Lines changed: 108 additions & 0 deletions
diff --git a/‎.github/workflows/ollama-utils-publish.yml‎
Lines changed: 68 additions & 0 deletions b/‎.github/workflows/ollama-utils-publish.yml‎
Lines changed: 68 additions & 0 deletions
diff --git a/‎.github/workflows/test.yml‎
Lines changed: 0 additions & 21 deletions b/‎.github/workflows/test.yml‎
Lines changed: 0 additions & 21 deletions
diff --git a/‎CODEOWNERS‎
Lines changed: 5 additions & 0 deletions b/‎CODEOWNERS‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 7 additions & 7 deletions b/‎README.md‎
Lines changed: 7 additions & 7 deletions
diff --git a/‎e2e/ts/tsconfig.json‎
Lines changed: 1 addition & 1 deletion b/‎e2e/ts/tsconfig.json‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎packages/gguf/README.md‎
Lines changed: 46 additions & 0 deletions b/‎packages/gguf/README.md‎
Lines changed: 46 additions & 0 deletions
diff --git a/‎packages/gguf/package.json‎
Lines changed: 6 additions & 2 deletions b/‎packages/gguf/package.json‎
Lines changed: 6 additions & 2 deletions
@@ -0,0 +1,108 @@
+# Runs the ollama-utils automap update script and opens a PR when the run leaves changes behind.
+name: Ollama template update
+on:
+  # push: # for debugging
+  workflow_dispatch: # manual trigger
+  schedule:
+    # NOTE(review): GitHub cron schedules are presumably evaluated in UTC, so "7am" below means 07:00 UTC — confirm
+    - cron: "0 7 * * 1" # every monday at 7am, so I'll review it after having a 🥐
+
+# Scopes requested for the workflow token
+permissions:
+  pull-requests: write # for creating PR
+  issues: write # for adding labels to the created PR
+  contents: write # for git push new branch
+
+jobs:
+  update-ollama-templates:
+    runs-on: ubuntu-latest
+    steps:
+      # Each step repeats the same repository guard, so it is skipped in any other repository.
+      - name: Checkout
+        if: github.repository == 'huggingface/huggingface.js'
+        uses: actions/checkout@v3
+
+      # Sets the git identity, installs pnpm and exposes today's UTC date as the CURRENT_DATE output.
+      - name: Prepare
+        id: prepare
+        if: github.repository == 'huggingface/huggingface.js'
+        shell: bash
+        run: |
+          git config --global user.name machineuser
+          git config --global user.email [email protected]
+          git config --global --add safe.directory "$GITHUB_WORKSPACE"
+          npm install -g pnpm
+          CURRENT_DATE="$(date -u +"%Y-%m-%d")"
+          # Print the value to the log and record it as a step output in one go.
+          echo "CURRENT_DATE=$CURRENT_DATE" | tee -a "$GITHUB_OUTPUT"
+
+      - name: Install dependencies
+        if: github.repository == 'huggingface/huggingface.js'
+        shell: bash
+        working-directory: packages/ollama-utils
+        run: pnpm install --frozen-lockfile
+
+      # Runs the package's build:automap script.
+      - name: Run update script
+        if: github.repository == 'huggingface/huggingface.js'
+        shell: bash
+        working-directory: packages/ollama-utils
+        run: pnpm run build:automap
+
+      # Commits the automap file to a dated branch and force-pushes it, but only when that
+      # file has changes. Outputs: HAS_CHANGES ('true' / 'false') and, when 'true', NEW_BRANCH.
+      - name: Check for changed files
+        id: changes
+        if: github.repository == 'huggingface/huggingface.js'
+        shell: bash
+        env:
+          CURRENT_DATE: ${{ steps.prepare.outputs.CURRENT_DATE }}
+        run: |
+          set -x
+
+          FILE_TO_ADD="packages/ollama-utils/src/chat-template-automap.ts"
+
+          # Full status is printed for debugging only.
+          git status
+          # Only the file that gets staged decides whether there is anything to commit.
+          # Checking the whole tree would make `git commit` exit non-zero ("nothing to commit")
+          # whenever some other file is dirty while the automap itself is unchanged.
+          modified_files="$(git status -s -- "${FILE_TO_ADD}")"
+          echo "Modified files: ${modified_files}"
+          if [ -n "${modified_files}" ]; then
+            NEW_BRANCH="ollama-${CURRENT_DATE}"
+            echo "NEW_BRANCH=${NEW_BRANCH}"
+            echo "Changes detected, will create a new branch:"
+            echo "${modified_files}"
+            git add "${FILE_TO_ADD}"
+            git commit -m "ollama update ${CURRENT_DATE}"
+            git checkout -b "${NEW_BRANCH}"
+            # Forced, so a branch of the same name left by an earlier run is overwritten.
+            git push -f origin "${NEW_BRANCH}"
+            echo "HAS_CHANGES=true" >> "$GITHUB_OUTPUT"
+            echo "NEW_BRANCH=${NEW_BRANCH}" >> "$GITHUB_OUTPUT"
+          else
+            echo "No files changed, skipping..."
+            echo "HAS_CHANGES=false" >> "$GITHUB_OUTPUT"
+          fi
+
+      # Opens a pull request from the pushed branch into main, using a dedicated token.
+      - name: Create PR
+        if: github.repository == 'huggingface/huggingface.js' && steps.changes.outputs.HAS_CHANGES == 'true'
+        uses: actions/github-script@v6
+        env:
+          NEW_BRANCH: ${{ steps.changes.outputs.NEW_BRANCH }}
+          CURRENT_DATE: ${{ steps.prepare.outputs.CURRENT_DATE }}
+        with:
+          github-token: ${{ secrets.HUGGINGFACE_JS_AUTOMATIC_PR }}
+          script: |
+            const { CURRENT_DATE: currDate, NEW_BRANCH: newBranch } = process.env;
+            const generatorLink =
+              '[generate-automap.ts](https://github.com/huggingface/huggingface.js/blob/main/packages/ollama-utils/scripts/generate-automap.ts)';
+
+            const result = await github.rest.pulls.create({
+              owner: context.repo.owner,
+              repo: context.repo.repo,
+              base: 'main',
+              head: newBranch,
+              title: `[ollama-utils] 🤖 Auto-update chat templates (${currDate})`,
+              body: `This PR is auto-generated by\n${generatorLink}.`
+            });
+
+            console.log({ result });
+            // Labelling the created PR is currently switched off:
+            // github.rest.issues.addLabels({
+            //   owner,
+            //   repo,
+            //   issue_number: result.data.number,
+            //   labels: ['feature', 'automated pr']
+            // });
@@ -0,0 +1,68 @@
+# Manually triggered release of @huggingface/ollama-utils: bumps the version,
+# publishes the package and pushes the release commit.
+name: Ollama Utils - Version and Release
+
+on:
+  workflow_dispatch:
+    inputs:
+      # Which part of the version to increment; handed to semver's inc() in the job below
+      newversion:
+        type: choice
+        description: "Semantic Version Bump Type"
+        default: patch
+        options:
+          - patch
+          - minor
+          - major
+
+# NOTE(review): the group name is not specific to this package — presumably shared with
+# other workflows that push to main so that they do not overlap; confirm
+concurrency:
+  group: "push-to-main"
+
+# Default working directory for the `run` steps of this workflow
+defaults:
+  run:
+    working-directory: packages/ollama-utils
+
+jobs:
+  version_and_release:
+    runs-on: ubuntu-latest
+    steps:
+      - name: Checkout with the bot token
+        uses: actions/checkout@v3
+        with:
+          # This token is required to push the commit and the tag to main; otherwise the push is rejected with:
+          # > Run git push --follow-tags
+          # remote: error: GH006: Protected branch update failed for refs/heads/main.
+          # remote: error: Changes must be made through a pull request. Required status check "lint" is expected.
+          token: ${{ secrets.BOT_ACCESS_TOKEN }}
+      - name: Enable corepack
+        run: |
+          npm install -g corepack@latest
+          corepack enable
+      - name: Set up Node.js for the npm registry
+        uses: actions/setup-node@v3
+        with:
+          node-version: "20"
+          cache: "pnpm"
+          cache-dependency-path: |
+            packages/ollama-utils/pnpm-lock.yaml
+          # REQUIRED: a registry must be set for the NODE_AUTH_TOKEN env variable (the npm token) to be enabled.
+          registry-url: "https://registry.npmjs.org"
+      - name: Install dependencies
+        run: pnpm install
+      - name: Configure git identity
+        run: |
+          git config --global user.name machineuser
+          git config --global user.email [email protected]
+      # Computes the next version from the selected bump type, writes it to package.json,
+      # then commits and tags the release locally.
+      - name: Bump version, commit and tag
+        env:
+          # Hand the workflow input over as an environment variable instead of expanding it
+          # inside the script text, so its value is never parsed as shell or JS source.
+          BUMP_TYPE: ${{ github.event.inputs.newversion }}
+        run: |
+          PACKAGE_VERSION=$(node -p "require('./package.json').version")
+          BUMPED_VERSION=$(node -p "require('semver').inc('$PACKAGE_VERSION', process.env.BUMP_TYPE)")
+          # semver.inc() yields null for an unusable version or bump type; stop before "null" gets released
+          if [ -z "$BUMPED_VERSION" ] || [ "$BUMPED_VERSION" = "null" ]; then
+            echo "Could not compute a '$BUMP_TYPE' bump of '$PACKAGE_VERSION'" >&2
+            exit 1
+          fi
+          # Update package.json with the new version
+          node -e "const fs = require('fs'); const package = JSON.parse(fs.readFileSync('./package.json')); package.version = '$BUMPED_VERSION'; fs.writeFileSync('./package.json', JSON.stringify(package, null, '\t') + '\n');"
+          git commit . -m "🔖 @huggingface/ollama-utils $BUMPED_VERSION"
+          # Annotated tag: `git push --follow-tags` does not push lightweight tags
+          git tag -a "ollama-utils-v$BUMPED_VERSION" -m "@huggingface/ollama-utils $BUMPED_VERSION"
+
+      # NOTE(review): the argument is `tasks` although this workflow releases ollama-utils —
+      # confirm it names the dependency to verify and is not a leftover from another workflow
+      - name: "Check Deps are published before publishing this package"
+        run: pnpm -w check-deps tasks
+
+      # Publish the package, authenticating with the npm token
+      - run: pnpm publish --no-git-checks .
+        env:
+          NODE_AUTH_TOKEN: ${{ secrets.NPM_TOKEN }}
+      # Rebase onto the remote branch, then push the release commit.
+      # NOTE(review): --follow-tags only pushes annotated tags reachable from the pushed
+      # commits — confirm the release tag created earlier actually reaches the remote
+      - run: git pull --rebase && git push --follow-tags
+      # hack - reuse actions/setup-node@v3 just to set a new registry
+      - uses: actions/setup-node@v3
+        with:
+          node-version: "20"
+          registry-url: "https://npm.pkg.github.com"
+      # Disable for now, until github supports PATs for writing github packages (https://github.com/github/roadmap/issues/558)
+      # - run: pnpm publish --no-git-checks .
+      #   env:
+      #     NODE_AUTH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
@@ -41,13 +41,6 @@ jobs:
         run: VCR_MODE=playback pnpm --filter ...[${{ steps.since.outputs.SINCE }}] test
         env:
           HF_TOKEN: ${{ secrets.HF_TOKEN }}
-          HF_FAL_KEY: dummy
-          HF_NEBIUS_KEY: dummy
-          HF_REPLICATE_KEY: dummy
-          HF_SAMBANOVA_KEY: dummy
-          HF_TOGETHER_KEY: dummy
-          HF_NOVITA_KEY: dummy
-          HF_FIREWORKS_KEY: dummy
 
   browser:
     runs-on: ubuntu-latest
@@ -84,13 +77,6 @@ jobs:
         run: VCR_MODE=playback pnpm --filter ...[${{ steps.since.outputs.SINCE }}] test:browser
         env:
           HF_TOKEN: ${{ secrets.HF_TOKEN }}
-          HF_FAL_KEY: dummy
-          HF_NEBIUS_KEY: dummy
-          HF_REPLICATE_KEY: dummy
-          HF_SAMBANOVA_KEY: dummy
-          HF_TOGETHER_KEY: dummy
-          HF_NOVITA_KEY: dummy
-          HF_FIREWORKS_KEY: dummy
 
   e2e:
     runs-on: ubuntu-latest
@@ -154,10 +140,3 @@ jobs:
         env:
           NPM_CONFIG_REGISTRY: http://localhost:4874/
           HF_TOKEN: ${{ secrets.HF_TOKEN }}
-          HF_FAL_KEY: dummy
-          HF_NEBIUS_KEY: dummy
-          HF_REPLICATE_KEY: dummy
-          HF_SAMBANOVA_KEY: dummy
-          HF_TOGETHER_KEY: dummy
-          HF_NOVITA_KEY: dummy
-          HF_FIREWORKS_KEY: dummy
@@ -23,4 +23,9 @@
 /packages/gguf @mishig25 @ngxson @julien-c
 
 # Ownership for the space-header Package
+
 /packages/space-header @enzostvs
+
+# Ownership for the ollama-utils Package
+
+/packages/ollama-utils @ngxson
@@ -23,7 +23,7 @@ await uploadFile({
   // Can work with native File in browsers
   file: {
     path: "pytorch_model.bin",
-    content: new Blob(...) 
+    content: new Blob(...)
   }
 });
 
@@ -39,7 +39,7 @@ await inference.chatCompletion({
   ],
   max_tokens: 512,
   temperature: 0.5,
-  provider: "sambanova", // or together, fal-ai, replicate, …
+  provider: "sambanova", // or together, fal-ai, replicate, cohere …
 });
 
 await inference.textToImage({
@@ -96,7 +96,7 @@ You can run our packages with vanilla JS, without any bundler, by using a CDN or
 
 ```html
 <script type="module">
-    import { HfInference } from 'https://cdn.jsdelivr.net/npm/@huggingface/inference@3.3.3/+esm';
+    import { HfInference } from 'https://cdn.jsdelivr.net/npm/@huggingface/inference@3.5.1/+esm';
     import { createRepo, commit, deleteRepo, listFiles } from "https://cdn.jsdelivr.net/npm/@huggingface/[email protected]/+esm";
 </script>
 ```
@@ -146,12 +146,12 @@ for await (const chunk of inference.chatCompletionStream({
   console.log(chunk.choices[0].delta.content);
 }
 
-/// Using a third-party provider: 
+/// Using a third-party provider:
 await inference.chatCompletion({
   model: "meta-llama/Llama-3.1-8B-Instruct",
   messages: [{ role: "user", content: "Hello, nice to meet you!" }],
   max_tokens: 512,
-  provider: "sambanova", // or together, fal-ai, replicate, …
+  provider: "sambanova", // or together, fal-ai, replicate, cohere …
 })
 
 await inference.textToImage({
@@ -211,7 +211,7 @@ await uploadFile({
   // Can work with native File in browsers
   file: {
     path: "pytorch_model.bin",
-    content: new Blob(...) 
+    content: new Blob(...)
   }
 });
 
@@ -244,7 +244,7 @@ console.log(messages); // contains the data
 
 // or you can run the code directly, however you can't check that the code is safe to execute this way, use at your own risk.
 const messages = await agent.run("Draw a picture of a cat wearing a top hat. Then caption the picture and read it out loud.")
-console.log(messages); 
+console.log(messages);
 ```
 
 There are more features of course, check each library's README!
 
@@ -1,6 +1,6 @@
 {
 	"compilerOptions": {
-		"target": "ES2015",
+		"target": "ES2022",
 		"module": "commonjs",
 		"strict": true,
 		"esModuleInterop": true,
 
@@ -96,6 +96,52 @@ In case you want to use your own GGUF metadata structure, you can disable strict
 const { metadata, tensorInfos }: GGUFParseOutput<{ strict: false }> = await gguf(URL_LLAMA);
 ```
 
+## Command line interface
+
+This package provides a CLI equivalent to the [`gguf_dump.py`](https://github.com/ggml-org/llama.cpp/blob/7a2c913e66353362d7f28d612fd3c9d51a831eda/gguf-py/gguf/scripts/gguf_dump.py) script. You can dump the GGUF metadata and the list of tensors using this command:
+
+```bash
+npx @huggingface/gguf my_model.gguf
+
+# or, with a remote GGUF file:
+# npx @huggingface/gguf https://huggingface.co/bartowski/Llama-3.2-1B-Instruct-GGUF/resolve/main/Llama-3.2-1B-Instruct-Q4_K_M.gguf
+```
+
+Example output:
+
+```
+* Dumping 36 key/value pair(s)
+  Idx | Count  | Value                                                                            
+  ----|--------|----------------------------------------------------------------------------------
+    1 |      1 | version = 3                                                                      
+    2 |      1 | tensor_count = 292                                                               
+    3 |      1 | kv_count = 33                                                                    
+    4 |      1 | general.architecture = "llama"                                                   
+    5 |      1 | general.type = "model"                                                           
+    6 |      1 | general.name = "Meta Llama 3.1 8B Instruct"                                      
+    7 |      1 | general.finetune = "Instruct"                                                    
+    8 |      1 | general.basename = "Meta-Llama-3.1"                                                   
+
+[truncated]
+
+* Dumping 292 tensor(s)
+  Idx | Num Elements | Shape                          | Data Type | Name                     
+  ----|--------------|--------------------------------|-----------|--------------------------
+    1 |           64 |     64,      1,      1,      1 | F32       | rope_freqs.weight        
+    2 |    525336576 |   4096, 128256,      1,      1 | Q4_K      | token_embd.weight        
+    3 |         4096 |   4096,      1,      1,      1 | F32       | blk.0.attn_norm.weight   
+    4 |     58720256 |  14336,   4096,      1,      1 | Q6_K      | blk.0.ffn_down.weight
+
+[truncated]
+```
+
+Alternatively, you can install this package globally, which provides the `gguf-view` command:
+
+```bash
+npm i -g @huggingface/gguf
+gguf-view my_model.gguf
+```
+
 ## Hugging Face Hub
 
 The Hub supports all file formats and has built-in features for GGUF format. 
 
@@ -1,7 +1,7 @@
 {
 	"name": "@huggingface/gguf",
 	"packageManager": "[email protected]",
-	"version": "0.1.12",
+	"version": "0.1.13",
 	"description": "a GGUF parser that works on remotely hosted files",
 	"repository": "https://github.com/huggingface/huggingface.js.git",
 	"publishConfig": {
@@ -10,6 +10,9 @@
 	"main": "./dist/index.js",
 	"module": "./dist/index.mjs",
 	"types": "./dist/index.d.ts",
+	"bin": {
+		"gguf-view": "./dist/cli.js"
+	},
 	"exports": {
 		".": {
 			"types": "./dist/index.d.ts",
@@ -18,6 +21,7 @@
 		}
 	},
 	"browser": {
+		"./src/cli.ts": false,
 		"./src/utils/FileBlob.ts": false,
 		"./dist/index.js": "./dist/browser/index.js",
 		"./dist/index.mjs": "./dist/browser/index.mjs"
@@ -32,7 +36,7 @@
 		"format": "prettier --write .",
 		"format:check": "prettier --check .",
 		"prepublishOnly": "pnpm run build",
-		"build": "tsup src/index.ts --format cjs,esm --clean && tsc --emitDeclarationOnly --declaration",
+		"build": "tsup src/index.ts src/cli.ts --format cjs,esm --clean && tsc --emitDeclarationOnly --declaration",
 		"build:llm": "tsx scripts/generate-llm.ts && pnpm run format",
 		"test": "vitest run",
 		"check": "tsc"
Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,6 @@`
`1`	`1`	`{`
`2`	`2`	`"compilerOptions": {`
`3`		`- "target": "ES2015",`
	`3`	`+ "target": "ES2022",`
`4`	`4`	`"module": "commonjs",`
`5`	`5`	`"strict": true,`
`6`	`6`	`"esModuleInterop": true,`