diff --git a/internal/namespaces/inference/v1beta1/custom_endpoint.go b/internal/namespaces/inference/v1beta1/custom_endpoint.go index 95641460f9..f204591113 100644 --- a/internal/namespaces/inference/v1beta1/custom_endpoint.go +++ b/internal/namespaces/inference/v1beta1/custom_endpoint.go @@ -32,15 +32,19 @@ func endpointCreateBuilder(c *core.Command) *core.Command { createEndpointCustomRequest := argsI.(*createEndpointRequestCustom) createEndpointreq := createEndpointCustomRequest.CreateEndpointRequest endpoint := createEndpointCustomRequest.Endpoint + endpointToCreate := inference.EndpointSpec{ + Public: nil, + PrivateNetwork: nil, + DisableAuth: endpoint.DisableAuth, + } if endpoint.IsPublic { publicEndpoint := &inference.EndpointSpecPublic{} - endpointToCreate := inference.EndpointSpec{ - Public: publicEndpoint, - PrivateNetwork: nil, - DisableAuth: endpoint.DisableAuth, - } - createEndpointreq.Endpoint = &endpointToCreate + endpointToCreate.Public = publicEndpoint + } + if endpoint.PrivateNetwork != nil && endpoint.PrivateNetwork.PrivateNetworkID != "" { + endpointToCreate.PrivateNetwork = &inference.EndpointSpecPrivateNetwork{PrivateNetworkID: endpoint.PrivateNetwork.PrivateNetworkID} } + createEndpointreq.Endpoint = &endpointToCreate return runner(ctx, createEndpointreq) } diff --git a/internal/namespaces/inference/v1beta1/helper_test.go b/internal/namespaces/inference/v1beta1/helper_test.go index 3b8b55cecc..e5ef4b7962 100644 --- a/internal/namespaces/inference/v1beta1/helper_test.go +++ b/internal/namespaces/inference/v1beta1/helper_test.go @@ -5,14 +5,14 @@ import "github.com/scaleway/scaleway-cli/v2/core" func CreateDeploymentPublicEndpoint() core.BeforeFunc { return core.ExecStoreBeforeCmd( "DEPLOYMENT", - "scw inference deployment create node-type=H100 accept-eula=true model-name=meta/llama-2-70b-chat:fp8 -w", + "scw inference deployment create node-type=H100 accept-eula=true model-name=mistral/mistral-7b-instruct-v0.3:bf16 -w", ) } func CreateDeploymentPrivateEndpoint() core.BeforeFunc { return core.ExecStoreBeforeCmd( "DEPLOYMENT", - "scw inference deployment create node-type=H100 accept-eula=true model-name=meta/llama-2-70b-chat:fp8 endpoints.0.private-network.private-network-id={{ .PN.ID }} -w", + "scw inference deployment create node-type=H100 accept-eula=true model-name=mistral/mistral-7b-instruct-v0.3:bf16 endpoints.0.private-network.private-network-id={{ .PN.ID }} -w", ) }