feat(plugin-ai): Adding command 'ai:models:call' #21

Merged · 5 commits · Sep 28, 2024
34 changes: 34 additions & 0 deletions README.md
@@ -28,6 +28,7 @@ USAGE
* [`heroku ai:docs`](#heroku-aidocs)
* [`heroku ai:models`](#heroku-aimodels)
* [`heroku ai:models:attach MODEL_RESOURCE`](#heroku-aimodelsattach-model_resource)
* [`heroku ai:models:call MODEL_RESOURCE`](#heroku-aimodelscall-model_resource)
* [`heroku ai:models:create MODEL_NAME`](#heroku-aimodelscreate-model_name)
* [`heroku ai:models:destroy MODEL_RESOURCE`](#heroku-aimodelsdestroy-model_resource)
* [`heroku ai:models:detach MODEL_RESOURCE`](#heroku-aimodelsdetach-model_resource)
@@ -97,6 +98,39 @@ EXAMPLES

_See code: [dist/commands/ai/models/attach.ts](https://github.com/heroku/heroku-cli-plugin-integration/blob/v0.0.0/dist/commands/ai/models/attach.ts)_

## `heroku ai:models:call MODEL_RESOURCE`

make an inference request to a specific AI model resource

```
USAGE
$ heroku ai:models:call [MODEL_RESOURCE] -p <value> [-a <value>] [--browser <value>] [-j] [--optfile <value>]
[--opts <value>] [-o <value>] [-r <value>]

ARGUMENTS
MODEL_RESOURCE The resource ID or alias of the model to call.

FLAGS
-a, --app=<value> app to run command against
-j, --json Output response as JSON
-o, --output=<value> The file path where the command writes the model response.
-p, --prompt=<value> (required) The input prompt for the model.
-r, --remote=<value> git remote of app to use
--browser=<value> browser to open URLs with (example: "firefox", "safari")
--optfile=<value> Additional options for model inference, provided as a JSON config file.
--opts=<value> Additional options for model inference, provided as a JSON string.

DESCRIPTION
make an inference request to a specific AI model resource

EXAMPLES
$ heroku ai:models:call my_llm --app my-app --prompt "What is the meaning of life?"

$ heroku ai:models:call sdxl --app my-app --prompt "Generate an image of a sunset" --opts '{"quality":"hd"}' -o sunset.png
```

_See code: [dist/commands/ai/models/call.ts](https://github.com/heroku/heroku-cli-plugin-integration/blob/v0.0.0/dist/commands/ai/models/call.ts)_
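
Both `--opts` and `--optfile` feed the same options object (inline `--opts` values win on key collisions), so a reusable JSON file can replace a long inline string. A minimal sketch; the option names `max_tokens` and `temperature` are illustrative inference parameters and depend on what the target model accepts:

```
$ cat options.json
{"max_tokens": 100, "temperature": 0.7}

$ heroku ai:models:call my_llm --app my-app --prompt "What is the meaning of life?" --optfile options.json
```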

## `heroku ai:models:create MODEL_NAME`

provision access to an AI model
35 changes: 2 additions & 33 deletions src/commands/ai/docs.ts
@@ -1,8 +1,5 @@
-import color from '@heroku-cli/color'
 import {flags} from '@heroku-cli/command'
-import {ux} from '@oclif/core'
-import {CLIError} from '@oclif/core/lib/errors'
-import open from 'open'
+import {openUrl} from '../../lib/open-url'
 import Command from '../../lib/base'
 
 export default class Docs extends Command {
@@ -12,39 +9,11 @@ export default class Docs extends Command {
     browser: flags.string({description: 'browser to open docs with (example: "firefox", "safari")'}),
   }
 
-  static urlOpener: (...args: Parameters<typeof open>) => ReturnType<typeof open> = open
-
   public async run(): Promise<void> {
     const {flags} = await this.parse(Docs)
     const browser = flags.browser
     const url = process.env.HEROKU_AI_DOCS_URL || Docs.defaultUrl
 
-    let browserErrorShown = false
-    const showBrowserError = (browser?: string) => {
-      if (browserErrorShown) return
-
-      ux.warn(`Unable to open ${browser ? browser : 'your default'} browser. Please visit ${color.cyan(url)} to view the documentation.`)
-      browserErrorShown = true
-    }
-
-    ux.log(`Opening ${color.cyan(url)} in ${browser ? browser : 'your default'} browser…`)
-
-    try {
-      await ux.anykey(
-        `Press any key to open up the browser to show Heroku AI documentation, or ${color.yellow('q')} to exit`
-      )
-    } catch (error) {
-      const {message, oclif} = error as CLIError
-      ux.error(message, {exit: oclif?.exit || 1})
-    }
-
-    const cp = await Docs.urlOpener(url, {wait: false, ...(browser ? {app: {name: browser}} : {})})
-    cp.on('error', (err: Error) => {
-      ux.warn(err)
-      showBrowserError(browser)
-    })
-    cp.on('close', (code: number) => {
-      if (code !== 0) showBrowserError(browser)
-    })
+    await openUrl(url, browser, 'view the documentation')
   }
 }
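
The shared `openUrl` helper that replaces the inlined logic above is not included in this diff view. Based on the removed code and the call sites (`openUrl(url, browser, 'view the documentation')` here and `openUrl(image.data[0].url, browser, 'view the image')` in call.ts below), a plausible sketch of `src/lib/open-url.ts` follows; the exact signature and messages are assumptions:

```
// Sketch of src/lib/open-url.ts; not part of this diff, reconstructed from the removed code.
import color from '@heroku-cli/color'
import {ux} from '@oclif/core'
import {CLIError} from '@oclif/core/lib/errors'
import open from 'open'

export async function openUrl(url: string, browser?: string, action = 'continue'): Promise<void> {
  let browserErrorShown = false
  const showBrowserError = () => {
    if (browserErrorShown) return
    browserErrorShown = true
    ux.warn(`Unable to open ${browser ? browser : 'your default'} browser. Please visit ${color.cyan(url)} to ${action}.`)
  }

  ux.log(`Opening ${color.cyan(url)} in ${browser ? browser : 'your default'} browser…`)

  try {
    // Let the user confirm (or abort with 'q') before a browser window is spawned.
    await ux.anykey(`Press any key to open up the browser to ${action}, or ${color.yellow('q')} to exit`)
  } catch (error) {
    const {message, oclif} = error as CLIError
    ux.error(message, {exit: oclif?.exit || 1})
  }

  const cp = await open(url, {wait: false, ...(browser ? {app: {name: browser}} : {})})
  cp.on('error', (err: Error) => {
    ux.warn(err)
    showBrowserError()
  })
  cp.on('close', (code: number) => {
    if (code !== 0) showBrowserError()
  })
}
```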
225 changes: 225 additions & 0 deletions src/commands/ai/models/call.ts
@@ -0,0 +1,225 @@
import color from '@heroku-cli/color'
import {flags} from '@heroku-cli/command'
import {Args, ux} from '@oclif/core'
import fs from 'node:fs'
import {ChatCompletionResponse, EmbeddingResponse, ImageResponse, ModelList} from '../../../lib/ai/types'
import Command from '../../../lib/base'
import {openUrl} from '../../../lib/open-url'

export default class Call extends Command {
static args = {
model_resource: Args.string({
description: 'The resource ID or alias of the model to call.',
required: true,
}),
}

static description = 'make an inference request to a specific AI model resource'
static examples = [
'heroku ai:models:call my_llm --app my-app --prompt "What is the meaning of life?"',
'heroku ai:models:call sdxl --app my-app --prompt "Generate an image of a sunset" --opts \'{"quality":"hd"}\' -o sunset.png',
]

static flags = {
app: flags.app({required: false}),
// interactive: flags.boolean({
// char: 'i',
// description: 'Use interactive mode for conversation beyond the initial prompt (not available on all models)',
// default: false,
// }),
browser: flags.string({description: 'browser to open URLs with (example: "firefox", "safari")'}),
json: flags.boolean({char: 'j', description: 'Output response as JSON'}),
optfile: flags.string({
description: 'Additional options for model inference, provided as a JSON config file.',
required: false,
}),
opts: flags.string({
description: 'Additional options for model inference, provided as a JSON string.',
required: false,
}),
output: flags.string({
char: 'o',
// description: 'The file path where the command writes the model response. If used with --interactive, this flag writes the entire exchange when the session closes.',
description: 'The file path where the command writes the model response.',
required: false,
}),
prompt: flags.string({
char: 'p',
description: 'The input prompt for the model.',
required: true,
}),
remote: flags.remote(),
}

public async run(): Promise<void> {
const {args, flags} = await this.parse(Call)
const {model_resource: modelResource} = args
const {app, browser, json, optfile, opts, output, prompt} = flags

// Initially, configure the default client to fetch the available model classes
await this.configureHerokuAIClient()
const {body: availableModels} = await this.herokuAI.get<ModelList>('/available-models')

// Now, configure the client to send a request for the target model resource
await this.configureHerokuAIClient(modelResource, app)
const options = this.parseOptions(optfile, opts)
// Not sure why `type` is an array in ModelListItem; we use the type from the first entry.
const modelType = availableModels.find(m => m.model_id === this.apiModelId)?.type[0]

switch (modelType) {
case 'Embedding': {
const embedding = await this.createEmbedding(prompt, options)
await this.displayEmbedding(embedding, output, json)
break
}

case 'Text-to-Image': {
const image = await this.generateImage(prompt, options)
await this.displayImageResult(image, output, browser, json)
break
}

case 'Text-to-Text': {
const completion = await this.createChatCompletion(prompt, options)
await this.displayChatCompletion(completion, output, json)
break
}

default:
throw new Error(`Unsupported model type: ${modelType}`)
}
}

/**
* Parse the model call request options from the command flags.
*
* @param optfile Path to a JSON file containing options.
* @param opts JSON string containing options.
* @returns The parsed options as an object.
*/
private parseOptions(optfile?: string, opts?: string) {
const options = {}

if (optfile) {
const optfileContents = fs.readFileSync(optfile)

try {
Object.assign(options, JSON.parse(optfileContents.toString()))
} catch (error: unknown) {
if (error instanceof SyntaxError) {
const {message} = error as SyntaxError
return ux.error(
`Invalid JSON in ${color.yellow(optfile)}. Check the formatting in your file.\n${message}`,
{exit: 1},
)
}

throw error
}
}

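// Merge order matters: --opts is parsed after --optfile, so inline values override file values on key collisions.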
if (opts) {
try {
Object.assign(options, JSON.parse(opts))
} catch (error: unknown) {
if (error instanceof SyntaxError) {
const {message} = error as SyntaxError
return ux.error(
`Invalid JSON. Check the formatting in your ${color.yellow('--opts')} value.\n${message}`,
{exit: 1},
)
}

throw error
}
}

return options
}

private async createChatCompletion(prompt: string, options = {}) {
const {body: chatCompletionResponse} = await this.herokuAI.post<ChatCompletionResponse>('/v1/chat/completions', {
body: {
...options,
model: this.apiModelId,
messages: [{
role: 'user',
content: prompt,
}],
},
headers: {authorization: `Bearer ${this.apiKey}`},
})

return chatCompletionResponse
}

private async displayChatCompletion(completion: ChatCompletionResponse, output?: string, json = false) {
const content = completion.choices[0].message.content || ''

if (output) {
fs.writeFileSync(output, json ? JSON.stringify(completion, null, 2) : content)
} else {
json ? ux.styledJSON(completion) : ux.log(content)
}
}

private async generateImage(prompt: string, options = {}) {
const {body: imageResponse} = await this.herokuAI.post<ImageResponse>('/v1/images/generations', {
body: {
...options,
model: this.apiModelId,
prompt,
},
headers: {authorization: `Bearer ${this.apiKey}`},
})

return imageResponse
}

private async displayImageResult(image: ImageResponse, output?: string, browser?: string, json = false) {
if (image.data[0].b64_json) {
if (output) {
const content = json ? JSON.stringify(image, null, 2) : Buffer.from(image.data[0].b64_json, 'base64')
fs.writeFileSync(output, content)
} else
json ? ux.styledJSON(image) : process.stdout.write(image.data[0].b64_json)
return
}

if (image.data[0].url) {
if (output)
fs.writeFileSync(output, json ? JSON.stringify(image, null, 2) : image.data[0].url)
else if (json)
ux.styledJSON(image)
else
await openUrl(image.data[0].url, browser, 'view the image')
return
}

// This should never happen, but we'll handle it anyway
ux.error('Unexpected response format', {exit: 1})
}

private async createEmbedding(input: string, options = {}) {
const {body: embeddingResponse} = await this.herokuAI.post<EmbeddingResponse>('/v1/embeddings', {
body: {
...options,
model: this.apiModelId,
input,
},
headers: {authorization: `Bearer ${this.apiKey}`},
})

return embeddingResponse
}

private async displayEmbedding(embedding: EmbeddingResponse, output?: string, json = false) {
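// The embedding vector is serialized as comma-separated values (Array.prototype.toString) unless --json is set.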
const content = (embedding.data[0].embeddings || []).toString()

if (output) {
fs.writeFileSync(output, json ? JSON.stringify(embedding, null, 2) : content)
} else {
json ? ux.styledJSON(embedding) : ux.log(content)
}
}
}