Merge 93540b5af9a5bac27e7d79c2e1ef80332e4232ff into 598f1826d8b2bc969aace2c6459824737667218c
This commit is contained in:
commit
4ccf494c52
@ -60,4 +60,28 @@ describe("media-understanding provider registry", () => {
|
||||
|
||||
expect(provider?.id).toBe("google");
|
||||
});
|
||||
|
||||
it("auto-registers media-understanding for config providers with image-capable models (#51392)", () => {
|
||||
const cfg = {
|
||||
models: {
|
||||
providers: {
|
||||
glm: {
|
||||
models: [{ id: "glm-4.6v", input: ["text", "image"] }],
|
||||
},
|
||||
textOnly: {
|
||||
models: [{ id: "text-model", input: ["text"] }],
|
||||
},
|
||||
},
|
||||
},
|
||||
} as never;
|
||||
const registry = buildMediaUnderstandingRegistry(undefined, cfg);
|
||||
const glmProvider = getMediaUnderstandingProvider("glm", registry);
|
||||
const textOnlyProvider = getMediaUnderstandingProvider("textOnly", registry);
|
||||
|
||||
expect(glmProvider?.id).toBe("glm");
|
||||
expect(glmProvider?.capabilities).toEqual(["image"]);
|
||||
expect(glmProvider?.describeImage).toBeDefined();
|
||||
expect(glmProvider?.describeImages).toBeDefined();
|
||||
expect(textOnlyProvider).toBeUndefined();
|
||||
});
|
||||
});
|
||||
|
||||
@ -5,6 +5,10 @@ import { getActivePluginRegistry } from "../../plugins/runtime.js";
|
||||
import type { MediaUnderstandingProvider } from "../types.js";
|
||||
import { deepgramProvider } from "./deepgram/index.js";
|
||||
import { groqProvider } from "./groq/index.js";
|
||||
import {
|
||||
describeImageWithModel,
|
||||
describeImagesWithModel,
|
||||
} from "./image.js";
|
||||
|
||||
const PROVIDERS: MediaUnderstandingProvider[] = [groqProvider, deepgramProvider];
|
||||
|
||||
@ -48,6 +52,28 @@ export function buildMediaUnderstandingRegistry(
|
||||
for (const entry of pluginRegistry?.mediaUnderstandingProviders ?? []) {
|
||||
mergeProviderIntoRegistry(registry, entry.provider);
|
||||
}
|
||||
// Auto-register media-understanding for config providers with image-capable models (#51392)
|
||||
const configProviders = cfg?.models?.providers;
|
||||
if (configProviders && typeof configProviders === "object") {
|
||||
for (const [providerKey, providerCfg] of Object.entries(configProviders)) {
|
||||
if (!providerKey?.trim()) continue;
|
||||
const normalizedKey = normalizeMediaProviderId(providerKey);
|
||||
if (registry.has(normalizedKey)) continue;
|
||||
const models = (providerCfg as { models?: Array<{ input?: string[] }> })?.models ?? [];
|
||||
const hasImageModel = models.some(
|
||||
(m) => Array.isArray(m?.input) && m.input.includes("image"),
|
||||
);
|
||||
if (hasImageModel) {
|
||||
const autoProvider: MediaUnderstandingProvider = {
|
||||
id: normalizedKey,
|
||||
capabilities: ["image"],
|
||||
describeImage: describeImageWithModel,
|
||||
describeImages: describeImagesWithModel,
|
||||
};
|
||||
mergeProviderIntoRegistry(registry, autoProvider);
|
||||
}
|
||||
}
|
||||
}
|
||||
if (overrides) {
|
||||
for (const [key, provider] of Object.entries(overrides)) {
|
||||
const normalizedKey = normalizeMediaProviderId(key);
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user