// Original script was GPT4 but it has been deeply Ship of Theseused.

import * as vscode from "vscode";
import axios from "axios";

// Extension settings, cached at module level and refreshed by updateVSConfig().
let VSConfig: vscode.WorkspaceConfiguration;
let apiEndpoint: string;
let apiModel: string;
let apiSystemMessage: string | undefined;
let numPredict: number;
let promptWindowSize: number;
let rawInput: boolean | undefined;
let completionKeys: string;
let responsePreview: boolean | undefined;
let responsePreviewMaxTokens: number;
let responsePreviewDelay: number;
let continueInline: boolean | undefined;

/**
 * Re-reads every setting of the "ollama-autocoder" configuration section into
 * the module-level variables above, applying the fallback values shown below
 * when a setting is unset or falsy.
 */
function updateVSConfig() {
  VSConfig = vscode.workspace.getConfiguration("ollama-autocoder");
  apiEndpoint = VSConfig.get("endpoint") || "http://localhost:11434/api/generate";
  apiModel = VSConfig.get("model") || "openhermes2.5-mistral:7b-q4_K_M"; // The model I tested with
  apiSystemMessage = VSConfig.get("system message");
  numPredict = VSConfig.get("max tokens predicted") || 500;
  promptWindowSize = VSConfig.get("prompt window size") || 2000;
  rawInput = VSConfig.get("raw input");
  completionKeys = VSConfig.get("completion keys") || " ";
  responsePreview = VSConfig.get("response preview");
  responsePreviewMaxTokens = VSConfig.get("preview max tokens") || 10;
  responsePreviewDelay = VSConfig.get("preview delay") || 0; // Must be || 0 instead of || [default] because of truthy
  continueInline = VSConfig.get("continue inline");

  // "DEFAULT" and raw-input mode both mean: send no system message at all.
  if (apiSystemMessage === "DEFAULT" || rawInput) apiSystemMessage = undefined;
}

updateVSConfig();

// No need for restart for any of these settings
vscode.workspace.onDidChangeConfiguration(updateVSConfig);

/**
 * Extracts a printable message from a caught value. Anything carrying a
 * `message` property (Error instances, axios cancel objects) yields that
 * message; every other value is stringified.
 */
function describeError(err: unknown): string {
  if (typeof err === "object" && err !== null && "message" in err) {
    return String((err as { message: unknown }).message);
  }
  return String(err);
}

/**
 * Internal autocomplete routine (not directly exposed): streams a completion
 * for the text before the cursor and inserts it into the document token by
 * token, showing a cancellable progress notification while it runs.
 *
 * @param textEditor Editor whose document and cursor position seed the prompt.
 * @param cancellationToken Optional token that aborts the request when cancelled.
 */
async function autocompleteCommand(textEditor: vscode.TextEditor, cancellationToken?: vscode.CancellationToken) {
  const document = textEditor.document;
  const position = textEditor.selection.active;

  // Get the current prompt: everything before the cursor, trimmed to the last promptWindowSize characters
  let prompt = document.getText(new vscode.Range(document.lineAt(0).range.start, position));
  prompt = prompt.substring(Math.max(0, prompt.length - promptWindowSize), prompt.length);

  // Show a progress message
  vscode.window.withProgress(
    {
      location: vscode.ProgressLocation.Notification,
      title: "Ollama Autocoder",
      cancellable: true,
    },
    async (progress, progressCancellationToken) => {
      // Event subscriptions created for this request; disposed in `finally`
      // so they do not accumulate across invocations.
      const listeners: vscode.Disposable[] = [];

      try {
        progress.report({ message: "Starting model..." });

        let axiosCancelPost: () => void;
        const axiosCancelToken = new axios.CancelToken((c) => {
          const cancelPost = function () {
            c("Autocompletion request terminated by user cancel");
          };
          axiosCancelPost = cancelPost;
          if (cancellationToken) listeners.push(cancellationToken.onCancellationRequested(cancelPost));
          listeners.push(progressCancellationToken.onCancellationRequested(cancelPost));
          listeners.push(vscode.workspace.onDidCloseTextDocument(cancelPost));
        });

        // Make a request to the ollama.ai REST API
        const response = await axios.post(apiEndpoint, {
          model: apiModel, // Change this to the model you want to use
          prompt: prompt,
          stream: true,
          system: apiSystemMessage,
          raw: rawInput,
          options: {
            num_predict: numPredict
          }
        }, {
          cancelToken: axiosCancelToken,
          responseType: 'stream'
        });

        // tracker
        let oldPosition = position;
        let currentPosition = position;
        let lastToken = "";

        // Stream framing state. The body is expected to be newline-delimited
        // JSON; a network chunk may carry several objects or only part of one,
        // so chunks are buffered and only complete lines are parsed.
        let pending = "";
        // Set once the request was cancelled or failed; later lines are ignored.
        let stopped = false;
        // Serialises insertions so edits are applied strictly in arrival order.
        let queue: Promise<void> = Promise.resolve();

        // Parses one JSON line and inserts its `response` text at the tracked position.
        const insertCompletion = async (line: string): Promise<void> => {
          if (stopped) return;

          // Check for user input (cancel): the text between the previous
          // insertion point and the cursor must still equal the last token.
          if (lastToken !== "") {
            const lastInput = document.getText(new vscode.Range(oldPosition, textEditor.selection.active));
            if (lastInput !== lastToken) {
              stopped = true;
              axiosCancelPost(); // cancel axios => cancel finished promise => close notification
              return;
            }
          }

          // Get a completion from the response
          const parsed: { response?: unknown } = JSON.parse(line);
          if (typeof parsed.response !== "string") return; // nothing insertable in this message
          const completion = parsed.response;
          lastToken = completion;

          // complete edit for token
          const edit = new vscode.WorkspaceEdit();
          const insertAt = new vscode.Position(
            currentPosition.line,
            currentPosition.character
          );
          edit.insert(document.uri, insertAt, completion);
          await vscode.workspace.applyEdit(edit);

          // Move the cursor to the end of the completion
          const completionLines = completion.split("\n");
          const newPosition = new vscode.Position(
            currentPosition.line + completionLines.length - 1,
            (completionLines.length > 1 ? 0 : currentPosition.character) + completionLines[completionLines.length - 1].length
          );
          const newSelection = new vscode.Selection(
            newPosition,
            newPosition
          );
          oldPosition = currentPosition;
          currentPosition = newPosition;

          // completion bar
          progress.report({ message: "Generating...", increment: 1 / (numPredict / 100) });

          // move cursor
          const editor = vscode.window.activeTextEditor;
          if (editor) editor.selection = newSelection;
        };

        // Keep cancel window available
        const finished = new Promise<boolean>((resolve, reject) => {
          // Appends one line to the insertion queue; a failure stops further
          // insertions, surfaces the error and aborts the request.
          const enqueue = (line: string) => {
            queue = queue.then(() => insertCompletion(line)).catch((err: unknown) => {
              stopped = true;
              reject(err);
              axiosCancelPost();
            });
          };

          response.data.on('data', (d: Uint8Array) => {
            progress.report({ message: "Generating..." });

            pending += d.toString();
            const lines = pending.split("\n");
            pending = lines.pop() || ""; // last piece is an incomplete line (or empty)
            for (const line of lines) {
              if (line.trim() !== "") enqueue(line);
            }
          });

          response.data.on('end', () => {
            // Flush a final line that was not newline-terminated.
            if (pending.trim() !== "") {
              enqueue(pending);
              pending = "";
            }
            // Report completion only after every queued insertion has been applied.
            queue.then(() => {
              progress.report({ message: "Ollama completion finished." });
              resolve(true);
            });
          });

          response.data.on('error', (err: unknown) => {
            // A stream error caused by our own cancellation is not a failure.
            if (axiosCancelToken.reason) resolve(false);
            else reject(err);
          });

          axiosCancelToken.promise.finally(() => { // prevent notification from freezing on user input cancel
            resolve(false);
          });
        });

        await finished;

      } catch (err: unknown) {
        // Show an error message
        vscode.window.showErrorMessage(
          "Ollama encountered an error: " + describeError(err)
        );
        console.log(err);
      } finally {
        // Release the cancellation / document-close subscriptions of this request.
        listeners.forEach((listener) => listener.dispose());
      }
    }
  );
}

/**
 * Called when the extension is activated. Registers the completion provider
 * (triggered by the configured completion keys) and the
 * "ollama-autocoder.autocomplete" command, and ties both to the extension context.
 */
function activate(context: vscode.ExtensionContext) {
  // Register a completion provider for every language ("*" selector)
  const completionProvider = vscode.languages.registerCompletionItemProvider("*", {
    async provideCompletionItems(document, position, cancellationToken) {

      // Create a completion item
      const item = new vscode.CompletionItem("Autocomplete with Ollama");

      // Set the insert text to a placeholder
      item.insertText = new vscode.SnippetString('${1:}');

      // Wait before initializing Ollama to reduce compute usage
      if (responsePreview) await new Promise(resolve => setTimeout(resolve, responsePreviewDelay * 1000));
      if (cancellationToken.isCancellationRequested) {
        return [ item ];
      }

      // Set the label & inset text to a shortened, non-stream response
      if (responsePreview) {
        let prompt = document.getText(new vscode.Range(document.lineAt(0).range.start, position));
        prompt = prompt.substring(Math.max(0, prompt.length - promptWindowSize), prompt.length);
        const response_preview = await axios.post(apiEndpoint, {
          model: apiModel, // Change this to the model you want to use
          prompt: prompt,
          stream: false,
          system: apiSystemMessage,
          raw: rawInput,
          options: {
            num_predict: responsePreviewMaxTokens, // reduced compute max
            stop: ['\n']
          }
        }, {
          cancelToken: new axios.CancelToken((c) => {
            const cancelPost = function () {
              c("Autocompletion request terminated by completion cancel");
            };
            cancellationToken.onCancellationRequested(cancelPost);
          })
        });

        if (response_preview.data.response.trim() != "") { // default if empty
          item.label = response_preview.data.response.trimStart(); // tended to add whitespace at the beginning
          item.insertText = response_preview.data.response.trimStart();
        }
      }

      // Set the documentation to a message
      item.documentation = new vscode.MarkdownString('Press `Enter` to get an autocompletion from Ollama');
      // Set the command to trigger the completion
      if (continueInline || !responsePreview) item.command = {
        command: 'ollama-autocoder.autocomplete',
        title: 'Autocomplete with Ollama',
        arguments: [cancellationToken]
      };
      // Return the completion item
      return [item];
    },
  },
    ...completionKeys.split("")
  );

  // Register a command for getting a completion from Ollama through command/keybind
  const externalAutocompleteCommand = vscode.commands.registerTextEditorCommand(
    "ollama-autocoder.autocomplete",
    (textEditor, _, cancellationToken?) => {
      // no cancellation token from here, but there is one from completionProvider
      autocompleteCommand(textEditor, cancellationToken);
    }
  );

  // Add the commands & completion provider to the context
  context.subscriptions.push(completionProvider);
  context.subscriptions.push(externalAutocompleteCommand);
}

// This method is called when extension is deactivated
function deactivate() { }

module.exports = {
  activate,
  deactivate,
};