Commit 10085e4

feat: ability to pick custom model

1 parent f342aee · commit 10085e4
6 files changed: +129 -51 lines changed

package.json

Lines changed: 42 additions & 20 deletions

@@ -38,23 +38,9 @@
       "properties": {
         "inference.endpoint": {
           "type": "string",
-          "default": "http://127.0.0.1:11434/",
-          "description": "Ollama Server Endpoint"
-        },
-        "inference.maxLines": {
-          "type": "number",
-          "default": 16,
-          "description": "Max number of lines to be keep."
-        },
-        "inference.maxTokens": {
-          "type": "number",
-          "default": 256,
-          "description": "Max number of new tokens to be generated."
-        },
-        "inference.temperature": {
-          "type": "number",
-          "default": 0.2,
-          "description": "Temperature of the model. Increasing the temperature will make the model answer more creatively."
+          "default": "",
+          "description": "Ollama Server Endpoint. Empty for local instance.",
+          "order": 1
         },
         "inference.model": {
           "type": "string",
@@ -81,10 +67,46 @@
             "deepseek-coder:6.7b-base-fp16",
             "deepseek-coder:33b-base-q4_K_S",
             "deepseek-coder:33b-base-q4_K_M",
-            "deepseek-coder:33b-base-fp16"
+            "deepseek-coder:33b-base-fp16",
+            "custom"
           ],
           "default": "deepseek-coder:1.3b-base-q4_1",
-          "description": "Inference model to use"
+          "description": "Inference model to use",
+          "order": 2
+        },
+        "inference.temperature": {
+          "type": "number",
+          "default": 0.2,
+          "description": "Temperature of the model. Increasing the temperature will make the model answer more creatively.",
+          "order": 3
+        },
+        "inference.custom.model": {
+          "type": "string",
+          "default": "",
+          "description": "Custom model name",
+          "order": 4
+        },
+        "inference.custom.format": {
+          "type": "string",
+          "enum": [
+            "codellama",
+            "deepseek"
+          ],
+          "default": "codellama",
+          "description": "Custom model prompt format",
+          "order": 5
+        },
+        "inference.maxLines": {
+          "type": "number",
+          "default": 16,
+          "description": "Max number of lines to be keep.",
+          "order": 6
+        },
+        "inference.maxTokens": {
+          "type": "number",
+          "default": 256,
+          "description": "Max number of new tokens to be generated.",
+          "order": 7
         }
       }
     }
@@ -111,4 +133,4 @@
     "ts-jest": "^29.1.1",
     "typescript": "^5.2.2"
   }
-}
+}
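
For reference, a minimal sketch of how the new settings fit together in a user's settings.json to point the extension at a model outside the built-in list. The model tag below is only an illustrative example, not something this commit ships:

{
  "inference.model": "custom",
  "inference.custom.model": "codellama:13b-code-q4_K_M",
  "inference.custom.format": "codellama"
}

When "inference.model" is left at one of the built-in entries, the two inference.custom.* settings are never read.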

src/config.ts

Lines changed: 50 additions & 0 deletions

@@ -0,0 +1,50 @@
+import vscode from 'vscode';
+
+class Config {
+
+    // Inference
+    get inference() {
+        let config = this.#config;
+
+        // Load endpoint
+        let endpoint = (config.get('endpoint') as string).trim();
+        if (endpoint.endsWith('/')) {
+            endpoint = endpoint.slice(0, endpoint.length - 1).trim();
+        }
+        if (endpoint === '') {
+            endpoint = 'http://127.0.0.1:11434';
+        }
+
+        // Load general parameters
+        let maxLines = config.get('maxLines') as number;
+        let maxTokens = config.get('maxTokens') as number;
+        let temperature = config.get('temperature') as number;
+
+        // Load model
+        let modelName = config.get('model') as string;
+        let modelFormat: 'codellama' | 'deepseek' = 'codellama';
+        if (modelName === 'custom') {
+            modelName = config.get('custom.model') as string;
+            modelFormat = config.get('custom.format') as 'codellama' | 'deepseek';
+        } else {
+            if (modelName.startsWith('deepseek-coder')) {
+                modelFormat = 'deepseek';
+            }
+        }
+
+        return {
+            endpoint,
+            maxLines,
+            maxTokens,
+            temperature,
+            modelName,
+            modelFormat
+        };
+    }
+
+    get #config() {
+        return vscode.workspace.getConfiguration('inference');
+    };
+}
+
+export const config = new Config();
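
A minimal sketch of how the new getter is meant to be consumed elsewhere in the extension (provider.ts below does essentially this); the comments restate the resolution logic implemented above:

import { config } from './config';

const { endpoint, modelName, modelFormat } = config.inference;
// endpoint falls back to http://127.0.0.1:11434 when the setting is empty.
// With "inference.model" set to "custom", modelName and modelFormat come from
// "inference.custom.model" and "inference.custom.format"; otherwise the format is
// inferred from the built-in name ('deepseek' for deepseek-coder models,
// 'codellama' for everything else).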

src/prompts/autocomplete.ts

Lines changed: 4 additions & 3 deletions

@@ -1,20 +1,21 @@
 import { ollamaTokenGenerator } from '../modules/ollamaTokenGenerator';
 import { countSymbol } from '../modules/text';
 import { info } from '../modules/log';
-import { adaptPrompt } from './adaptors/adaptPrompt';
+import { ModelFormat, adaptPrompt } from './processors/models';
 
 export async function autocomplete(args: {
     endpoint: string,
     model: string,
+    format: ModelFormat,
     prefix: string,
-    suffix: string | null,
+    suffix: string,
     maxLines: number,
     maxTokens: number,
     temperature: number,
     canceled?: () => boolean,
 }): Promise<string> {
 
-    let prompt = adaptPrompt({ prefix: args.prefix, suffix: args.suffix, model: args.model });
+    let prompt = adaptPrompt({ prefix: args.prefix, suffix: args.suffix, format: args.format });
 
     // Calculate arguments
     let data = {
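
For illustration, a hypothetical call using the new format argument, the defaults from package.json, and a locally running Ollama endpoint; the prefix and suffix values are made up:

const completion = await autocomplete({
    endpoint: 'http://127.0.0.1:11434',
    model: 'deepseek-coder:1.3b-base-q4_1',
    format: 'deepseek',
    prefix: 'function add(a: number, b: number) {\n    return ',
    suffix: '\n}\n',
    maxLines: 16,
    maxTokens: 256,
    temperature: 0.2,
    canceled: () => false // no cancellation in this sketch
});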

src/prompts/preparePrompt.ts

Lines changed: 4 additions & 4 deletions

@@ -9,14 +9,14 @@ export async function preparePrompt(document: vscode.TextDocument, position: vsc
     let text = document.getText();
     let offset = document.offsetAt(position);
     let prefix = text.slice(0, offset);
-    let suffix: string | null = text.slice(offset);
+    let suffix: string = text.slice(offset);
 
     // Trim suffix
     // If suffix is too small it is safe to assume that it could be ignored which would allow us to use
     // more powerful completition instead of in middle one
-    if (suffix.length < 256) {
-        suffix = null;
-    }
+    // if (suffix.length < 256) {
+    //     suffix = null;
+    // }
 
     // Add filename and language to prefix
     // NOTE: Most networks don't have a concept of filenames and expected language, but we expect that some files in training set has something in title that

src/prompts/adaptors/adaptPrompt.ts renamed to src/prompts/processors/models.ts

Lines changed: 10 additions & 8 deletions

@@ -1,15 +1,17 @@
-export function adaptPrompt(args: { model: string, prefix: string, suffix: string | null }): { prompt: string, stop: string[] } {
+export type ModelFormat = 'codellama' | 'deepseek';
+
+export function adaptPrompt(args: { format: ModelFormat, prefix: string, suffix: string }): { prompt: string, stop: string[] } {
 
     // Common non FIM mode
-    if (!args.suffix) {
-        return {
-            prompt: args.prefix,
-            stop: [`<END>`]
-        };
-    }
+    // if (!args.suffix) {
+    //     return {
+    //         prompt: args.prefix,
+    //         stop: [`<END>`]
+    //     };
+    // }
 
     // Starcoder FIM
-    if (args.model.startsWith('deepseek-coder')) {
+    if (args.format === 'deepseek') {
         return {
             prompt: `<|fim▁begin|>${args.prefix}<|fim▁hole|>${args.suffix}<|fim▁end|>`,
             stop: [`<|fim▁begin|>`, `<|fim▁hole|>`, `<|fim▁end|>`, `<END>`]
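
A quick sketch of what the 'deepseek' branch shown above produces; the prefix and suffix are illustrative:

import { adaptPrompt } from './processors/models';

const { prompt, stop } = adaptPrompt({
    format: 'deepseek',
    prefix: 'const greeting = ',
    suffix: ';\n'
});
// prompt === '<|fim▁begin|>const greeting = <|fim▁hole|>;\n<|fim▁end|>'
// stop contains the three FIM markers plus '<END>'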

src/prompts/provider.ts

Lines changed: 19 additions & 16 deletions

@@ -7,6 +7,7 @@ import { getFromPromptCache, setPromptToCache } from './promptCache';
 import { isNotNeeded, isSupported } from './filter';
 import { ollamaCheckModel } from '../modules/ollamaCheckModel';
 import { ollamaDownloadModel } from '../modules/ollamaDownloadModel';
+import { config } from '../config';
 
 export class PromptProvider implements vscode.InlineCompletionItemProvider {
 
@@ -62,22 +63,23 @@
         if (cached === undefined) {
 
             // Config
-            let config = vscode.workspace.getConfiguration('inference');
-            let endpoint = config.get('endpoint') as string;
-            let model = config.get('model') as string;
-            let maxLines = config.get('maxLines') as number;
-            let maxTokens = config.get('maxTokens') as number;
-            let temperature = config.get('temperature') as number;
-            if (endpoint.endsWith('/')) {
-                endpoint = endpoint.slice(0, endpoint.length - 1);
-            }
+            let inferenceConfig = config.inference;
+            // let config = vscode.workspace.getConfiguration('inference');
+            // let endpoint = config.get('endpoint') as string;
+            // let model = config.get('model') as string;
+            // let maxLines = config.get('maxLines') as number;
+            // let maxTokens = config.get('maxTokens') as number;
+            // let temperature = config.get('temperature') as number;
+            // if (endpoint.endsWith('/')) {
+            //     endpoint = endpoint.slice(0, endpoint.length - 1);
+            // }
 
             // Update status
             this.statusbar.text = `$(sync~spin) Llama Coder`;
             try {
 
                 // Check model exists
-                let modelExists = await ollamaCheckModel(endpoint, model);
+                let modelExists = await ollamaCheckModel(inferenceConfig.endpoint, inferenceConfig.modelName);
                 if (token.isCancellationRequested) {
                     info(`Canceled after AI completion.`);
                     return;
@@ -86,7 +88,7 @@ export class PromptProvider implements vscode.InlineCompletionItemProvider {
                 // Download model if not exists
                 if (!modelExists) {
                     this.statusbar.text = `$(sync~spin) Downloading`;
-                    await ollamaDownloadModel(endpoint, model);
+                    await ollamaDownloadModel(inferenceConfig.endpoint, inferenceConfig.modelName);
                     this.statusbar.text = `$(sync~spin) Llama Coder`;
                 }
                 if (token.isCancellationRequested) {
@@ -99,11 +101,12 @@ export class PromptProvider implements vscode.InlineCompletionItemProvider {
                 res = await autocomplete({
                     prefix: prepared.prefix,
                     suffix: prepared.suffix,
-                    endpoint: endpoint,
-                    model: model,
-                    maxLines: maxLines,
-                    maxTokens: maxTokens,
-                    temperature,
+                    endpoint: inferenceConfig.endpoint,
+                    model: inferenceConfig.modelName,
+                    format: inferenceConfig.modelFormat,
+                    maxLines: inferenceConfig.maxLines,
+                    maxTokens: inferenceConfig.maxTokens,
+                    temperature: inferenceConfig.temperature,
                     canceled: () => token.isCancellationRequested,
                 });
                 info(`AI completion completed: ${res}`);

