generated from SAP/repository-template
-
Notifications
You must be signed in to change notification settings - Fork 15
/
Copy pathdeployment-resolver.ts
214 lines (193 loc) · 5.62 KB
/
deployment-resolver.ts
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
import { ErrorWithCause } from '@sap-cloud-sdk/util';
import {
type AiDeployment,
DeploymentApi
} from '../client/AI_CORE_API/index.js';
import { deploymentCache } from './deployment-cache.js';
import { extractModel, type FoundationModel } from './model.js';
import type { HttpDestinationOrFetchOptions } from '@sap-cloud-sdk/connectivity';
/**
* The model deployment configuration when using a model.
* @typeParam ModelNameT - String literal type representing the name of the model.
*/
export interface ModelConfig<ModelNameT = string> {
/**
* The name of the model.
*/
modelName: ModelNameT;
/**
* The version of the model.
*/
modelVersion?: string;
}
/**
* The deployment configuration when using a deployment ID.
*/
export interface DeploymentIdConfig {
/**
* The deployment ID.
*/
deploymentId: string;
}
/**
* The deployment configuration when using a resource group.
*/
export interface ResourceGroupConfig {
/**
* The resource group of the deployment.
*/
resourceGroup?: string;
}
/**
* The configuration of a model deployment.
* @typeParam ModelNameT - String literal type representing the name of the model.
*/
export type ModelDeployment<ModelNameT = string> =
| ModelNameT
| ((ModelConfig<ModelNameT> | DeploymentIdConfig) & ResourceGroupConfig);
/**
* @internal
*/
export function getResourceGroup(
modelDeployment: ModelDeployment
): string | undefined {
return typeof modelDeployment === 'object'
? modelDeployment.resourceGroup
: undefined;
}
/**
* Type guard to check if the given deployment configuration is a deployment ID configuration.
* @param modelDeployment - Configuration to check.
* @returns `true` if the configuration is a deployment ID configuration, `false` otherwise.
*/
function isDeploymentIdConfig(
modelDeployment: ModelDeployment
): modelDeployment is DeploymentIdConfig {
return (
typeof modelDeployment === 'object' && 'deploymentId' in modelDeployment
);
}
/**
* The options for the deployment resolution.
* @internal
*/
export interface DeploymentResolutionOptions {
/**
* The scenario ID of the deployment.
*/
scenarioId: string;
/**
* The name and potentially version of the model to look for.
*/
model?: FoundationModel;
/**
* The executable ID of the deployment.
*/
executableId?: string;
/**
* The resource group of the deployment.
*/
resourceGroup?: string;
/**
* The destination to use for the request.
*/
destination?: HttpDestinationOrFetchOptions;
}
/**
* Query the AI Core service for a deployment that matches the given criteria. If more than one deployment matches the criteria, the first one's ID is returned.
* @param opts - The options for the deployment resolution.
* @returns A promise of a deployment, if a deployment was found, fails otherwise.
* @internal
*/
export async function resolveDeploymentId(
opts: DeploymentResolutionOptions
): Promise<string> {
const { model } = opts;
const cachedDeployment = deploymentCache.get(opts);
if (cachedDeployment?.id) {
return cachedDeployment.id;
}
let deployments = await getAllDeployments(opts);
if (model) {
deployments = deployments.filter(
deployment => extractModel(deployment)?.name === model.name
);
if (model.version) {
deployments = deployments.filter(
deployment => extractModel(deployment)?.version === model.version
);
}
}
if (!deployments.length) {
throw new Error(
`No deployment matched the given criteria: ${JSON.stringify(opts)}. Make sure the deployment is successful, as it is a prerequisite before consuming orchestration or foundation models.`
);
}
return deployments[0].id;
}
/**
* Get all deployments that match the given criteria.
* @param opts - The options for the deployment resolution.
* @returns A promise of an array of deployments.
* @internal
*/
export async function getAllDeployments(
opts: DeploymentResolutionOptions
): Promise<AiDeployment[]> {
const {
destination,
scenarioId,
executableId,
resourceGroup = 'default'
} = opts;
try {
const { resources } = await DeploymentApi.deploymentQuery(
{
scenarioId,
status: 'RUNNING',
...(executableId && { executableIds: [executableId] })
},
{ 'AI-Resource-Group': resourceGroup }
).execute(destination);
deploymentCache.setAll(opts, resources);
return resources;
} catch (error: any) {
throw new ErrorWithCause('Failed to fetch the list of deployments.', error);
}
}
/**
* Get the deployment ID for a given model deployment configuration and executable ID using the 'foundation-models' scenario.
* @param modelDeployment - The model deployment configuration.
* @param executableId - The executable ID.
* @returns The ID of the deployment, if found.
* @internal
*/
export async function getDeploymentId(
modelDeployment: ModelDeployment,
executableId: string,
destination?: HttpDestinationOrFetchOptions
): Promise<string> {
if (isDeploymentIdConfig(modelDeployment)) {
return modelDeployment.deploymentId;
}
const model =
typeof modelDeployment === 'string'
? { modelName: modelDeployment }
: modelDeployment;
return resolveDeploymentId({
scenarioId: 'foundation-models',
executableId,
model: translateToFoundationModel(model),
resourceGroup: model.resourceGroup,
destination
});
}
function translateToFoundationModel(modelConfig: ModelConfig): FoundationModel {
if (typeof modelConfig === 'string') {
return { name: modelConfig };
}
return {
name: modelConfig.modelName,
...(modelConfig.modelVersion && { version: modelConfig.modelVersion })
};
}