add support for conversational state to assistance endpoint (#506)

* add support for conversational state to assistance endpoint This refactors the assistance code somewhat, to allow carrying along some conversational state. It extends the OpenAI-flavored assistant to make use of that state to have a conversation. The front-end is tweaked a little bit to allow for replies that don't have any code in them (though I didn't get into formatting such replies nicely). Currently tested primarily through the runCompletion script, which has been extended a bit to allow testing simulated conversations (where an error is pasted in follow-up, or an expected-vs-actual comparison). Co-authored-by: George Gevoian <85144792+georgegevoian@users.noreply.github.com>
2026-03-02 04:09:24 +00:00 · 2023-05-08 11:15:22 -07:00
parent 68fbeb4d7b
commit 51a195bd94
10 changed files with 587 additions and 185 deletions
--- a/app/server/lib/ActiveDoc.ts
+++ b/app/server/lib/ActiveDoc.ts
@@ -14,7 +14,7 @@ import {
 } from 'app/common/ActionBundle';
 import {ActionGroup, MinimalActionGroup} from 'app/common/ActionGroup';
 import {ActionSummary} from "app/common/ActionSummary";
-import {Prompt, Suggestion} from "app/common/AssistancePrompts";
+import {AssistanceRequest, AssistanceResponse} from "app/common/AssistancePrompts";
 import {
  AclResources,
  AclTableDescription,
@@ -85,7 +85,7 @@ import {Document} from 'app/gen-server/entity/Document';
 import {ParseOptions} from 'app/plugin/FileParserAPI';
 import {AccessTokenOptions, AccessTokenResult, GristDocAPI} from 'app/plugin/GristAPI';
 import {compileAclFormula} from 'app/server/lib/ACLFormula';
-import {sendForCompletion} from 'app/server/lib/Assistance';
+import {AssistanceDoc, AssistanceSchemaPromptV1Context, sendForCompletion} from 'app/server/lib/Assistance';
 import {Authorizer} from 'app/server/lib/Authorizer';
 import {checksumFile} from 'app/server/lib/checksumFile';
 import {Client} from 'app/server/lib/Client';
@@ -180,7 +180,7 @@ interface UpdateUsageOptions {
 * either .loadDoc() or .createEmptyDoc() is called.
 * @param {String} docName - The document's filename, without the '.grist' extension.
 */
-export class ActiveDoc extends EventEmitter {
+export class ActiveDoc extends EventEmitter implements AssistanceDoc {
  /**
   * Decorator for ActiveDoc methods that prevents shutdown while the method is running, i.e.
   * until the returned promise is resolved.
@@ -1112,7 +1112,7 @@ export class ActiveDoc extends EventEmitter {
   * @param {Integer} rowId - Row number
   * @returns {Promise} Promise for a error message
   */
-  public async getFormulaError(docSession: DocSession, tableId: string, colId: string,
+  public async getFormulaError(docSession: OptDocSession, tableId: string, colId: string,
                               rowId: number): Promise<CellValue> {
    // Throw an error if the user doesn't have access to read this cell.
    await this._granularAccess.getCellValue(docSession, {tableId, colId, rowId});
@@ -1260,22 +1260,28 @@ export class ActiveDoc extends EventEmitter {
    return this._pyCall('autocomplete', txt, tableId, columnId, rowId, user.toJSON());
  }

-  public async getAssistance(docSession: DocSession, userPrompt: Prompt): Promise<Suggestion> {
-    // Making a prompt can leak names of tables and columns.
+  public async getAssistance(docSession: DocSession, request: AssistanceRequest): Promise<AssistanceResponse> {
+    return this.getAssistanceWithOptions(docSession, request);
+  }
+
+  public async getAssistanceWithOptions(docSession: DocSession,
+                                        request: AssistanceRequest): Promise<AssistanceResponse> {
+    // Making a prompt leaks names of tables and columns etc.
    if (!await this._granularAccess.canScanData(docSession)) {
      throw new Error("Permission denied");
    }
    await this.waitForInitialization();
-    const { tableId, colId, description } = userPrompt;
-    const prompt = await this._pyCall('get_formula_prompt', tableId, colId, description);
-    this._log.debug(docSession, 'getAssistance prompt', {prompt});
-    const completion = await sendForCompletion(prompt);
-    this._log.debug(docSession, 'getAssistance completion', {completion});
-    const formula = await this._pyCall('convert_formula_completion', completion);
-    const action: DocAction = ["ModifyColumn", tableId, colId, {formula}];
-    return {
-      suggestedActions: [action],
-    };
+    return sendForCompletion(this, request);
+  }
+
+  // Callback to make a data-engine formula tweak for assistance.
+  public assistanceFormulaTweak(txt: string) {
+    return this._pyCall('convert_formula_completion', txt);
+  }
+
+  // Callback to generate a prompt containing schema info for assistance.
+  public assistanceSchemaPromptV1(options: AssistanceSchemaPromptV1Context): Promise<string> {
+    return this._pyCall('get_formula_prompt', options.tableId, options.colId, options.docString);
  }

  public fetchURL(docSession: DocSession, url: string, options?: FetchUrlOptions): Promise<UploadResult> {
--- a/app/server/lib/Assistance.ts
+++ b/app/server/lib/Assistance.ts
@@ -2,116 +2,320 @@
 * Module with functions used for AI formula assistance.
 */

+import {AssistanceRequest, AssistanceResponse} from 'app/common/AssistancePrompts';
 import {delay} from 'app/common/delay';
+import {DocAction} from 'app/common/DocActions';
 import log from 'app/server/lib/log';
 import fetch from 'node-fetch';

 export const DEPS = { fetch };

-export async function sendForCompletion(prompt: string): Promise<string> {
-  let completion: string|null = null;
-  let retries: number = 0;
-  const openApiKey = process.env.OPENAI_API_KEY;
-  const model = process.env.COMPLETION_MODEL || "text-davinci-002";
+/**
+ * An assistant can help a user do things with their document,
+ * by interfacing with an external LLM endpoint.
+ */
+export interface Assistant {
+  apply(doc: AssistanceDoc, request: AssistanceRequest): Promise<AssistanceResponse>;
+}

+/**
+ * Document-related methods for use in the implementation of assistants.
+ * Somewhat ad-hoc currently.
+ */
+export interface AssistanceDoc {
+  /**
+   * Generate a particular prompt coded in the data engine for some reason.
+   * It makes python code for some tables, and starts a function body with
+   * the given docstring.
+   * Marked "V1" to suggest that it is a particular prompt and it would
+   * be great to try variants.
+   */
+  assistanceSchemaPromptV1(options: AssistanceSchemaPromptV1Context): Promise<string>;
+
+  /**
+   * Some tweaks to a formula after it has been generated.
+   */
+  assistanceFormulaTweak(txt: string): Promise<string>;
+}
+
+export interface AssistanceSchemaPromptV1Context {
+  tableId: string,
+  colId: string,
+  docString: string,
+}
+
+/**
+ * A flavor of assistant for use with the OpenAI API.
+ * Tested primarily with text-davinci-002 and gpt-3.5-turbo.
+ */
+export class OpenAIAssistant implements Assistant {
+  private _apiKey: string;
+  private _model: string;
+  private _chatMode: boolean;
+  private _endpoint: string;
+
+  public constructor() {
+    const apiKey = process.env.OPENAI_API_KEY;
+    if (!apiKey) {
+      throw new Error('OPENAI_API_KEY not set');
+    }
+    this._apiKey = apiKey;
+    this._model = process.env.COMPLETION_MODEL || "text-davinci-002";
+    this._chatMode = this._model.includes('turbo');
+    this._endpoint = `https://api.openai.com/v1/${this._chatMode ? 'chat/' : ''}completions`;
+  }
+
+  public async apply(doc: AssistanceDoc, request: AssistanceRequest): Promise<AssistanceResponse> {
+    const messages = request.state?.messages || [];
+    const chatMode = this._chatMode;
+    if (chatMode) {
+      if (messages.length === 0) {
+        messages.push({
+          role: 'system',
+          content: 'The user gives you one or more Python classes, ' +
+            'with one last method that needs completing. Write the ' +
+            'method body as a single code block, ' +
+            'including the docstring the user gave. ' +
+            'Just give the Python code as a markdown block, ' +
+            'do not give any introduction, that will just be ' +
+            'awkward for the user when copying and pasting. ' +
+            'You are working with Grist, an environment very like ' +
+            'regular Python except `rec` (like record) is used ' +
+            'instead of `self`. ' +
+            'Include at least one `return` statement or the method ' +
+            'will fail, disappointing the user. ' +
+            'Your answer should be the body of a single method, ' +
+            'not a class, and should not include `dataclass` or ' +
+            '`class` since the user is counting on you to provide ' +
+            'a single method. Thanks!'
+        });
+        messages.push({
+          role: 'user', content: await makeSchemaPromptV1(doc, request),
+        });
+      } else {
+        if (request.regenerate) {
+          if (messages[messages.length - 1].role !== 'user') {
+            messages.pop();
+          }
+        }
+        messages.push({
+          role: 'user', content: request.text,
+        });
+      }
+    } else {
+      messages.length = 0;
+      messages.push({
+        role: 'user', content: await makeSchemaPromptV1(doc, request),
+      });
+    }
+
+    const apiResponse = await DEPS.fetch(
+      this._endpoint,
+      {
+        method: "POST",
+        headers: {
+          "Authorization": `Bearer ${this._apiKey}`,
+          "Content-Type": "application/json",
+        },
+        body: JSON.stringify({
+          ...(!this._chatMode ? {
+            prompt: messages[messages.length - 1].content,
+          } : { messages }),
+          max_tokens: 1500,
+          temperature: 0,
+          model: this._model,
+          stop: this._chatMode ? undefined : ["\n\n"],
+        }),
+      },
+    );
+    if (apiResponse.status !== 200) {
+      log.error(`OpenAI API returned ${apiResponse.status}: ${await apiResponse.text()}`);
+      throw new Error(`OpenAI API returned status ${apiResponse.status}`);
+    }
+    const result = await apiResponse.json();
+    let completion: string = String(chatMode ? result.choices[0].message.content : result.choices[0].text);
+    const reply = completion;
+    const history = { messages };
+    if (chatMode) {
+      history.messages.push(result.choices[0].message);
+      // This model likes returning markdown. Code will typically
+      // be in a code block with ``` delimiters.
+      let lines = completion.split('\n');
+      if (lines[0].startsWith('```')) {
+        lines.shift();
+        completion = lines.join('\n');
+        const parts = completion.split('```');
+        if (parts.length > 1) {
+          completion = parts[0];
+        }
+        lines = completion.split('\n');
+      }
+
+      // This model likes repeating the function signature and
+      // docstring, so we try to strip that out.
+      completion = lines.join('\n');
+      while (completion.includes('"""')) {
+        const parts = completion.split('"""');
+        completion = parts[parts.length - 1];
+      }
+
+      // If there's no code block, don't treat the answer as a formula.
+      if (!reply.includes('```')) {
+        completion = '';
+      }
+    }
+
+    const response = await completionToResponse(doc, request, completion, reply);
+    if (chatMode) {
+      response.state = history;
+    }
+    return response;
+  }
+}
+
+export class HuggingFaceAssistant implements Assistant {
+  private _apiKey: string;
+  private _completionUrl: string;
+
+  public constructor() {
+    const apiKey = process.env.HUGGINGFACE_API_KEY;
+    if (!apiKey) {
+      throw new Error('HUGGINGFACE_API_KEY not set');
+    }
+    this._apiKey = apiKey;
+    // COMPLETION_MODEL values I've tried:
+    //   - codeparrot/codeparrot
+    //   - NinedayWang/PolyCoder-2.7B
+    //   - NovelAI/genji-python-6B
+    let completionUrl = process.env.COMPLETION_URL;
+    if (!completionUrl) {
+      if (process.env.COMPLETION_MODEL) {
+        completionUrl = `https://api-inference.huggingface.co/models/${process.env.COMPLETION_MODEL}`;
+      } else {
+        completionUrl = 'https://api-inference.huggingface.co/models/NovelAI/genji-python-6B';
+      }
+    }
+    this._completionUrl = completionUrl;
+
+  }
+
+  public async apply(doc: AssistanceDoc, request: AssistanceRequest): Promise<AssistanceResponse> {
+    if (request.state) {
+      throw new Error("HuggingFaceAssistant does not support state");
+    }
+    const prompt = await makeSchemaPromptV1(doc, request);
+    const response = await DEPS.fetch(
+      this._completionUrl,
+      {
+        method: "POST",
+        headers: {
+          "Authorization": `Bearer ${this._apiKey}`,
+          "Content-Type": "application/json",
+        },
+        body: JSON.stringify({
+          inputs: prompt,
+          parameters: {
+            return_full_text: false,
+            max_new_tokens: 50,
+          },
+        }),
+      },
+    );
+    if (response.status === 503) {
+      log.error(`Sleeping for 10s - HuggingFace API returned ${response.status}: ${await response.text()}`);
+      await delay(10000);
+    }
+    if (response.status !== 200) {
+      const text = await response.text();
+      log.error(`HuggingFace API returned ${response.status}: ${text}`);
+      throw new Error(`HuggingFace API returned status ${response.status}: ${text}`);
+    }
+    const result = await response.json();
+    let completion = result[0].generated_text;
+    completion = completion.split('\n\n')[0];
+    return completionToResponse(doc, request, completion);
+  }
+}
+
+/**
+ * Instantiate an assistant, based on environment variables.
+ */
+function getAssistant() {
+  if (process.env.OPENAI_API_KEY) {
+    return new OpenAIAssistant();
+  }
+  if (process.env.HUGGINGFACE_API_KEY) {
+    return new HuggingFaceAssistant();
+  }
+  throw new Error('Please set OPENAI_API_KEY or HUGGINGFACE_API_KEY');
+}
+
+/**
+ * Service a request for assistance, with a little retry logic
+ * since these endpoints can be a bit flakey.
+ */
+export async function sendForCompletion(doc: AssistanceDoc,
+                                        request: AssistanceRequest): Promise<AssistanceResponse> {
+  const assistant = getAssistant();
+
+  let retries: number = 0;
+
+  let response: AssistanceResponse|null = null;
  while(retries++ < 3) {
    try {
-      if (openApiKey) {
-        completion = await sendForCompletionOpenAI(prompt, openApiKey, model);
-      }
-      if (process.env.HUGGINGFACE_API_KEY) {
-        completion = await sendForCompletionHuggingFace(prompt);
-      }
+      response = await assistant.apply(doc, request);
      break;
    } catch(e) {
+      log.error(`Completion error: ${e}`);
      await delay(1000);
    }
  }
-  if (completion === null) {
-    throw new Error("Please set OPENAI_API_KEY or HUGGINGFACE_API_KEY (and optionally COMPLETION_MODEL)");
+  if (!response) {
+    throw new Error('Failed to get response from assistant');
  }
-  log.debug(`Received completion:`, {completion});
-  completion = completion.split(/\n {4}[^ ]/)[0];
-  return completion;
+  return response;
 }

-
-async function sendForCompletionOpenAI(prompt: string, apiKey: string, model = "text-davinci-002") {
-  if (!apiKey) {
-    throw new Error("OPENAI_API_KEY not set");
+async function makeSchemaPromptV1(doc: AssistanceDoc, request: AssistanceRequest) {
+  if (request.context.type !== 'formula') {
+    throw new Error('makeSchemaPromptV1 only works for formulas');
  }
-  const response = await DEPS.fetch(
-    "https://api.openai.com/v1/completions",
-    {
-      method: "POST",
-      headers: {
-        "Authorization": `Bearer ${apiKey}`,
-        "Content-Type": "application/json",
-      },
-      body: JSON.stringify({
-        prompt,
-        max_tokens: 150,
-        temperature: 0,
-        // COMPLETION_MODEL of `code-davinci-002` may be better if you have access to it.
-        model,
-        stop: ["\n\n"],
-      }),
-    },
-  );
-  if (response.status !== 200) {
-    log.error(`OpenAI API returned ${response.status}: ${await response.text()}`);
-    throw new Error(`OpenAI API returned status ${response.status}`);
-  }
-  const result = await response.json();
-  const completion = result.choices[0].text;
-  return completion;
+  return doc.assistanceSchemaPromptV1({
+    tableId: request.context.tableId,
+    colId: request.context.colId,
+    docString: request.text,
+  });
 }

-async function sendForCompletionHuggingFace(prompt: string) {
-  const apiKey = process.env.HUGGINGFACE_API_KEY;
-  if (!apiKey) {
-    throw new Error("HUGGINGFACE_API_KEY not set");
+async function completionToResponse(doc: AssistanceDoc, request: AssistanceRequest,
+                                    completion: string, reply?: string): Promise<AssistanceResponse> {
+  if (request.context.type !== 'formula') {
+    throw new Error('completionToResponse only works for formulas');
  }
-  // COMPLETION_MODEL values I've tried:
-  //   - codeparrot/codeparrot
-  //   - NinedayWang/PolyCoder-2.7B
-  //   - NovelAI/genji-python-6B
-  let completionUrl = process.env.COMPLETION_URL;
-  if (!completionUrl) {
-    if (process.env.COMPLETION_MODEL) {
-      completionUrl = `https://api-inference.huggingface.co/models/${process.env.COMPLETION_MODEL}`;
-    } else {
-      completionUrl = 'https://api-inference.huggingface.co/models/NovelAI/genji-python-6B';
+  completion = await doc.assistanceFormulaTweak(completion);
+  // A leading newline is common.
+  if (completion.charAt(0) === '\n') {
+    completion = completion.slice(1);
+  }
+  // If all non-empty lines have four spaces, remove those spaces.
+  // They are common for GPT-3.5, which matches the prompt carefully.
+  const lines = completion.split('\n');
+  const ok = lines.every(line => line === '\n' || line.startsWith('    '));
+  if (ok) {
+    completion = lines.map(line => line === '\n' ? line : line.slice(4)).join('\n');
+  }
+
+  // Suggest an action only if the completion is non-empty (that is,
+  // it actually looked like code).
+  const suggestedActions: DocAction[] = completion ? [[
+    "ModifyColumn",
+    request.context.tableId,
+    request.context.colId, {
+      formula: completion,
    }
-  }
-
-  const response = await DEPS.fetch(
-    completionUrl,
-    {
-      method: "POST",
-      headers: {
-        "Authorization": `Bearer ${apiKey}`,
-        "Content-Type": "application/json",
-      },
-      body: JSON.stringify({
-        inputs: prompt,
-        parameters: {
-          return_full_text: false,
-          max_new_tokens: 50,
-        },
-      }),
-    },
-  );
-  if (response.status === 503) {
-    log.error(`Sleeping for 10s - HuggingFace API returned ${response.status}: ${await response.text()}`);
-    await delay(10000);
-  }
-  if (response.status !== 200) {
-    const text = await response.text();
-    log.error(`HuggingFace API returned ${response.status}: ${text}`);
-    throw new Error(`HuggingFace API returned status ${response.status}: ${text}`);
-  }
-  const result = await response.json();
-  const completion = result[0].generated_text;
-  return completion.split('\n\n')[0];
+  ]] : [];
+  return {
+    suggestedActions,
+    reply,
+  };
 }
--- a/app/server/lib/GranularAccess.ts
+++ b/app/server/lib/GranularAccess.ts
@@ -376,7 +376,8 @@ export class GranularAccess implements GranularAccessForBundle {
    function fail(): never {
      throw new ErrorWithCode('ACL_DENY', 'Cannot access cell');
    }
-    if (!await this.hasTableAccess(docSession, cell.tableId)) { fail(); }
+    const hasExceptionalAccess = this._hasExceptionalFullAccess(docSession);
+    if (!hasExceptionalAccess && !await this.hasTableAccess(docSession, cell.tableId)) { fail(); }
    let rows: TableDataAction|null = null;
    if (docData) {
      const record = docData.getTable(cell.tableId)?.getRecord(cell.rowId);
@@ -393,16 +394,18 @@ export class GranularAccess implements GranularAccessForBundle {
      return fail();
    }
    const rec = new RecordView(rows, 0);
-    const input: AclMatchInput = {...await this.inputs(docSession), rec, newRec: rec};
-    const rowPermInfo = new PermissionInfo(this._ruler.ruleCollection, input);
-    const rowAccess = rowPermInfo.getTableAccess(cell.tableId).perms.read;
-    if (rowAccess === 'deny') { fail(); }
-    if (rowAccess !== 'allow') {
-      const colAccess = rowPermInfo.getColumnAccess(cell.tableId, cell.colId).perms.read;
-      if (colAccess === 'deny') { fail(); }
+    if (!hasExceptionalAccess) {
+      const input: AclMatchInput = {...await this.inputs(docSession), rec, newRec: rec};
+      const rowPermInfo = new PermissionInfo(this._ruler.ruleCollection, input);
+      const rowAccess = rowPermInfo.getTableAccess(cell.tableId).perms.read;
+      if (rowAccess === 'deny') { fail(); }
+      if (rowAccess !== 'allow') {
+        const colAccess = rowPermInfo.getColumnAccess(cell.tableId, cell.colId).perms.read;
+        if (colAccess === 'deny') { fail(); }
+      }
+      const colValues = rows[3];
+      if (!(cell.colId in colValues)) { fail(); }
    }
-    const colValues = rows[3];
-    if (!(cell.colId in colValues)) { fail(); }
    return rec.get(cell.colId);
  }