ex3ndr
diff --git a/‎CHANGELOG.md
Lines changed: 0 additions & 13 deletions b/‎CHANGELOG.md
Lines changed: 0 additions & 13 deletions
diff --git a/‎README.md
Lines changed: 16 additions & 2 deletions b/‎README.md
Lines changed: 16 additions & 2 deletions
diff --git a/‎jest.config.js
Lines changed: 7 additions & 0 deletions b/‎jest.config.js
Lines changed: 7 additions & 0 deletions
diff --git a/‎jest.setup.js
Lines changed: 1 addition & 0 deletions b/‎jest.setup.js
Lines changed: 1 addition & 0 deletions
diff --git a/‎package.json
Lines changed: 9 additions & 9 deletions b/‎package.json
Lines changed: 9 additions & 9 deletions
diff --git a/‎src/prompts/adaptors/adaptPrompt.ts
Lines changed: 11 additions & 11 deletions b/‎src/prompts/adaptors/adaptPrompt.ts
Lines changed: 11 additions & 11 deletions
diff --git a/‎src/prompts/autocomplete.ts
Lines changed: 1 addition & 1 deletion b/‎src/prompts/autocomplete.ts
Lines changed: 1 addition & 1 deletion
diff --git a/‎src/prompts/preparePrompt.ts
Lines changed: 13 additions & 12 deletions b/‎src/prompts/preparePrompt.ts
Lines changed: 13 additions & 12 deletions
diff --git a/‎src/prompts/processors/comment.ts
Lines changed: 12 additions & 0 deletions b/‎src/prompts/processors/comment.ts
Lines changed: 12 additions & 0 deletions
diff --git a/‎src/prompts/processors/detectLanguage.spec.ts
Lines changed: 7 additions & 0 deletions b/‎src/prompts/processors/detectLanguage.spec.ts
Lines changed: 7 additions & 0 deletions
@@ -42,6 +42,20 @@ Currently Llama Coder supports only Codellama. Model is quantized in different w
 * m - slow on MacOS
 * g - slow on older NVidia cards (pre 30xx)
 
-## License
+## Changelog
 
-MIT
+## [0.0.8]
+- Improved DeepSeek support and language detection
+
+## [0.0.7]
+- Added DeepSeek support
+- Ability to change temperature and top p
+- Fixed some bugs
+
+## [0.0.6]
+- Fix ollama links
+- Added more models
+
+## [0.0.4]
+
+- Initial release of Llama Coder
@@ -0,0 +1,7 @@
+/** @type {import('ts-jest/dist/types').InitialOptionsTsJest} */
+module.exports = { // Jest configuration for the TypeScript unit tests
+  preset: 'ts-jest', // use the ts-jest preset so .ts test files can be run by Jest
+  testEnvironment: 'node',
+  testPathIgnorePatterns: ["/node_modules/","/out/"], // skip dependencies and the out/ directory
+  setupFiles: ['./jest.setup.js'] // executed before the tests; jest.setup.js loads dotenv
+};
@@ -0,0 +1 @@
+require('dotenv').config();
@@ -2,7 +2,7 @@
   "name": "llama-coder",
   "displayName": "Llama Coder",
   "description": "Better and self-hosted Github Copilot replacement",
-  "version": "0.0.7",
+  "version": "0.0.8",
   "icon": "icon.png",
   "publisher": "ex3ndr",
   "repository": {
@@ -93,19 +93,19 @@
     "watch": "tsc -watch -p ./",
     "pretest": "yarn run compile && yarn run lint",
     "lint": "eslint src --ext ts",
-    "test": "node ./out/test/runTest.js",
+    "test": "jest",
     "package": "vsce package"
   },
   "devDependencies": {
-    "@types/vscode": "^1.84.0",
-    "@types/mocha": "^10.0.3",
+    "@types/jest": "^29.5.10",
     "@types/node": "18.x",
+    "@types/vscode": "^1.84.0",
     "@typescript-eslint/eslint-plugin": "^6.9.0",
     "@typescript-eslint/parser": "^6.9.0",
+    "dotenv": "^16.3.1",
     "eslint": "^8.52.0",
-    "glob": "^10.3.10",
-    "mocha": "^10.2.0",
-    "typescript": "^5.2.2",
-    "@vscode/test-electron": "^2.3.6"
+    "jest": "^29.7.0",
+    "ts-jest": "^29.1.1",
+    "typescript": "^5.2.2"
   }
-}
+}
@@ -1,22 +1,22 @@
-export function adaptPrompt(args: { model: string, prefix: string, suffix: string }): { prompt: string, stop: string[] } {
+export function adaptPrompt(args: { model: string, prefix: string, suffix: string | null }): { prompt: string, stop: string[] } {
 
-    // Starcoder format
-    if (args.model.startsWith('deepseek-coder')) {
-
-        if (args.suffix.length < 1000) {
-            return {
-                prompt: args.prefix,
-                stop: [`<END>`]
-            };
-        }
+    // Common non FIM mode
+    if (!args.suffix) {
+        return {
+            prompt: args.prefix,
+            stop: [`<END>`]
+        };
+    }
 
+    // Starcoder FIM
+    if (args.model.startsWith('deepseek-coder')) {
         return {
             prompt: `<｜fim▁begin｜>${args.prefix}<｜fim▁hole｜>${args.suffix}<｜fim▁end｜>`,
             stop: [`<｜fim▁begin｜>`, `<｜fim▁hole｜>`, `<｜fim▁end｜>`, `<END>`]
         };
     }
 
-    // Codellama format
+    // Codellama FIM
     return {
         prompt: `<PRE> ${args.prefix} <SUF>${args.suffix} <MID>`,
         stop: [`<PRE>`, `<SUF>`, `<MID>`, `<END>`]
 
@@ -7,7 +7,7 @@ export async function autocomplete(args: {
     endpoint: string,
     model: string,
     prefix: string,
-    suffix: string,
+    suffix: string | null,
     maxLines: number,
     maxTokens: number,
     temperature: number,
 
@@ -1,30 +1,31 @@
 import vscode from 'vscode';
-import path from 'path';
+import { detectLanguage } from './processors/detectLanguage';
+import { fileHeaders } from './processors/fileHeaders';
+import { languages } from './processors/languages';
 
 export async function preparePrompt(document: vscode.TextDocument, position: vscode.Position, context: vscode.InlineCompletionContext) {
 
     // Load document text
     let text = document.getText();
     let offset = document.offsetAt(position);
     let prefix = text.slice(0, offset);
-    let suffix = text.slice(offset);
+    let suffix: string | null = text.slice(offset);
 
     // Trim suffix
-    // NOTE: It seems that most neural networks are built have a focus on last characters and we therefore need to trim them to not get weird results.
-    // TODO: Better solution?
-    // TODO: Am i right here? What if we would want to generate something that uses something in the end of the file?
-    if (suffix.length > 256) {
-        suffix = suffix.slice(0, 256);
+    // If the suffix is too small, it is safe to assume that it can be ignored, which allows us to use
+    // the more powerful plain completion instead of the fill-in-the-middle one
+    if (suffix.length < 256) {
+        suffix = null;
     }
 
     // Add filename and language to prefix
     // NOTE: Most networks don't have a concept of filenames and expected language, but we expect that some files in training set has something in title that 
     //       would indicate filename and language
-    // NOTE: We are building for typescript for now so we can use C-style comments to indicate filename
-    let filename = path.basename(document.fileName);
-    let language = document.languageId;
-    let filenamePrefix = `/* ${language}, filename: ${filename} */`;
-    prefix = filenamePrefix + '\n' + prefix;
+    // NOTE: If we can't detect language, we could ignore this since the number of languages that need detection is limited
+    let language = detectLanguage(document.uri.fsPath, document.languageId);
+    if (language) {
+        prefix = fileHeaders(prefix, document.uri.fsPath, languages[language]);
+    }
 
     return {
         prefix,
 
@@ -0,0 +1,12 @@
+import { LanguageDescriptor } from "./languages";
+
+export function comment(text: string, language: LanguageDescriptor): string | null { // Wraps text in the comment markers of the given language; returns null when the descriptor has no comment definition
+    if (language.comment) {
+        if (language.comment.end) { // An end marker is defined: surround the text with start and end markers
+            return `${language.comment.start} ${text} ${language.comment.end}`;
+        } else { // No end marker: only the start marker is placed before the text
+            return `${language.comment.start} ${text}`;
+        }
+    }
+    return null; // The language descriptor carries no comment syntax
+}
@@ -0,0 +1,7 @@
+import { detectLanguage } from './detectLanguage';
+
+describe('detectLanguage', () => {
+    it('should detect language from happy path', () => {
+        // NOTE(review): the test body is empty, so this case passes without asserting anything about detectLanguage
+    });
+});