-
Notifications
You must be signed in to change notification settings - Fork 38
/
Copy pathsagemaker_jumpstart_model-stack.ts
57 lines (50 loc) · 2.28 KB
/
sagemaker_jumpstart_model-stack.ts
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
/**
* Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
*
* Licensed under the Apache License, Version 2.0 (the "License"). You may not use this file except in compliance
* with the License. A copy of the License is located at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* or in the 'license' file accompanying this file. This file is distributed on an 'AS IS' BASIS, WITHOUT WARRANTIES
* OR CONDITIONS OF ANY KIND, express or implied. See the License for the specific language governing permissions
* and limitations under the License.
*/
import * as path from 'path';
import * as cdk from 'aws-cdk-lib';
import * as lambda from 'aws-cdk-lib/aws-lambda';
import { Construct } from 'constructs';
import * as genai from '@cdklabs/generative-ai-cdk-constructs';
/**
 * CDK stack that provisions a SageMaker JumpStart real-time endpoint together
 * with a Lambda function that is granted permission to invoke that endpoint.
 */
export class SagemakerJumpstartModelStack extends cdk.Stack {
  /**
   * @param scope - Construct that owns this stack.
   * @param id - Identifier of the stack within `scope`.
   * @param props - Optional stack properties, forwarded unchanged to `cdk.Stack`.
   */
  constructor(scope: Construct, id: string, props?: cdk.StackProps) {
    super(scope, id, props);

    // Template-level description; independent of the resources declared below.
    this.templateOptions.description =
      'Description: (uksb-1tupboc43) (tag: Sagemaker Jumpstart Model Stack)';

    // Endpoint name requested from the JumpStart construct.
    const requestedEndpointName = 'testllamatwo';

    // JumpStart model (Llama 2 7B, version 2.0.2 per the model constant) hosted
    // on a real-time SageMaker endpoint backed by an ml.g5.2xlarge instance.
    // NOTE(review): acceptEula is left at false on purpose here; the construct
    // presumably requires it to be set to true explicitly (after the license has
    // been reviewed) before an EULA-gated model can be deployed - confirm
    // against the construct documentation.
    const llamaEndpoint = new genai.JumpStartSageMakerEndpoint(this, 'testllamatwosevenb', {
      model: genai.JumpStartModel.META_TEXTGENERATION_LLAMA_2_7B_F_2_0_2,
      instanceType: genai.SageMakerInstanceType.ML_G5_2XLARGE,
      acceptEula: false,
      endpointName: requestedEndpointName,
    });

    // The handler sources live in the `lambda` directory next to this file's parent folder.
    const handlerAssetDir = path.join(__dirname, '../lambda');

    // The handler receives the endpoint name through its environment. The value
    // is read back from the underlying CfnEndpoint rather than from the local
    // constant, so it reflects whatever name the construct actually configured.
    const handlerEnvironment = {
      ENDPOINT_NAME: llamaEndpoint.cfnEndpoint.endpointName!,
    };

    // Lambda request handler used to interact with the SageMaker endpoint.
    const invokeHandler = new lambda.Function(this, 'DemoRequestHandlerJumpstart', {
      functionName: 'lambdallama2',
      description: 'Lambda request handler used to interact with the SageMaker endpoint',
      code: lambda.Code.fromAsset(handlerAssetDir),
      handler: 'lambda.handler',
      runtime: lambda.Runtime.PYTHON_3_12,
      architecture: lambda.Architecture.ARM_64,
      memorySize: 1024,
      timeout: cdk.Duration.minutes(15),
      tracing: lambda.Tracing.ACTIVE,
      environment: handlerEnvironment,
    });

    // Allow the handler's execution role to invoke the endpoint.
    llamaEndpoint.grantInvoke(invokeHandler);
  }
}