File tree: 2 files changed, +12 -8 lines changed
internal/namespaces/inference/v1beta1: 2 files changed, +12 -8 lines changed
Original file line number | Diff line number | Diff line change
@@ -32,15 +32,19 @@ func endpointCreateBuilder(c *core.Command) *core.Command {
32
32
createEndpointCustomRequest := argsI .(* createEndpointRequestCustom )
33
33
createEndpointreq := createEndpointCustomRequest .CreateEndpointRequest
34
34
endpoint := createEndpointCustomRequest .Endpoint
35
+ endpointToCreate := inference.EndpointSpec {
36
+ Public : nil ,
37
+ PrivateNetwork : nil ,
38
+ DisableAuth : endpoint .DisableAuth ,
39
+ }
35
40
if endpoint .IsPublic {
36
41
publicEndpoint := & inference.EndpointSpecPublic {}
37
- endpointToCreate := inference.EndpointSpec {
38
- Public : publicEndpoint ,
39
- PrivateNetwork : nil ,
40
- DisableAuth : endpoint .DisableAuth ,
41
- }
42
- createEndpointreq .Endpoint = & endpointToCreate
42
+ endpointToCreate .Public = publicEndpoint
43
+ }
44
+ if endpoint .PrivateNetwork != nil && endpoint .PrivateNetwork .PrivateNetworkID != "" {
45
+ endpointToCreate .PrivateNetwork = & inference.EndpointSpecPrivateNetwork {PrivateNetworkID : endpoint .PrivateNetwork .PrivateNetworkID }
43
46
}
47
+ createEndpointreq .Endpoint = & endpointToCreate
44
48
45
49
return runner (ctx , createEndpointreq )
46
50
}
Original file line number | Diff line number | Diff line change
@@ -5,14 +5,14 @@ import "github.com/scaleway/scaleway-cli/v2/core"
5
5
func CreateDeploymentPublicEndpoint () core.BeforeFunc {
6
6
return core .ExecStoreBeforeCmd (
7
7
"DEPLOYMENT" ,
8
- "scw inference deployment create node-type=H100 accept-eula=true model-name=meta/llama-2-70b-chat:fp8 -w" ,
8
+ "scw inference deployment create node-type=H100 accept-eula=true model-name=mistral/mistral-7b-instruct-v0.3:bf16 -w" ,
9
9
)
10
10
}
11
11
12
12
func CreateDeploymentPrivateEndpoint () core.BeforeFunc {
13
13
return core .ExecStoreBeforeCmd (
14
14
"DEPLOYMENT" ,
15
- "scw inference deployment create node-type=H100 accept-eula=true model-name=meta/llama-2-70b-chat:fp8 endpoints.0.private-network.private-network-id={{ .PN.ID }} -w" ,
15
+ "scw inference deployment create node-type=H100 accept-eula=true model-name=mistral/mistral-7b-instruct-v0.3:bf16 endpoints.0.private-network.private-network-id={{ .PN.ID }} -w" ,
16
16
)
17
17
}
18
18
You can’t perform that action at this time.
0 commit comments