From 7ae110494f40bea666c435ebbc9726c70b424651 Mon Sep 17 00:00:00 2001 From: Krzysztof Nozderko Date: Tue, 26 Nov 2024 17:14:38 +0100 Subject: [PATCH 1/2] SNOW-1789757 Support GCP region specific endpoint --- .../UnitTests/PutGetStageInfoTest.cs | 59 +++++++++++++++++++ .../UnitTests/SFGCSClientTest.cs | 33 ++++++++++- .../FileTransfer/StorageClient/SFGCSClient.cs | 50 ++++++++++++---- Snowflake.Data/Core/RestResponse.cs | 17 ++++++ 4 files changed, 147 insertions(+), 12 deletions(-) create mode 100644 Snowflake.Data.Tests/UnitTests/PutGetStageInfoTest.cs diff --git a/Snowflake.Data.Tests/UnitTests/PutGetStageInfoTest.cs b/Snowflake.Data.Tests/UnitTests/PutGetStageInfoTest.cs new file mode 100644 index 000000000..85a34b222 --- /dev/null +++ b/Snowflake.Data.Tests/UnitTests/PutGetStageInfoTest.cs @@ -0,0 +1,59 @@ +using System.Collections.Generic; +using NUnit.Framework; +using Snowflake.Data.Core; +using Snowflake.Data.Core.FileTransfer; + +namespace Snowflake.Data.Tests.UnitTests +{ + [TestFixture] + public class PutGetStageInfoTest + { + [Test] + [TestCaseSource(nameof(TestCases))] + public void TestGcmRegionalUrl(string region, bool useRegionalUrl, string endPoint, string expectedGcmEndpoint) + { + // arrange + var stageInfo = CreateGCSStageInfo(region, useRegionalUrl, endPoint); + + // act + var gcsCustomEndpoint = stageInfo.GcsCustomEndpoint(); + + // assert + Assert.AreEqual(expectedGcmEndpoint, gcsCustomEndpoint); + } + + internal static IEnumerable TestCases() + { + yield return new object[] { "US-CENTRAL1", false, null, null }; + yield return new object[] { "US-CENTRAL1", false, "", null }; + yield return new object[] { "US-CENTRAL1", false, "null", null }; + yield return new object[] { "US-CENTRAL1", false, " ", null }; + yield return new object[] { "US-CENTRAL1", false, "example.com", "example.com" }; + yield return new object[] { "ME-CENTRAL2", false, null, "storage.me-central2.rep.googleapis.com" }; + yield return new object[] { "ME-CENTRAL2", true, null, "storage.me-central2.rep.googleapis.com" }; + yield return new object[] { "ME-CENTRAL2", true, "", "storage.me-central2.rep.googleapis.com" }; + yield return new object[] { "ME-CENTRAL2", true, " ", "storage.me-central2.rep.googleapis.com" }; + yield return new object[] { "ME-CENTRAL2", true, "example.com", "example.com" }; + yield return new object[] { "US-CENTRAL1", true, null, "storage.us-central1.rep.googleapis.com" }; + yield return new object[] { "US-CENTRAL1", true, "", "storage.us-central1.rep.googleapis.com" }; + yield return new object[] { "US-CENTRAL1", true, " ", "storage.us-central1.rep.googleapis.com" }; + yield return new object[] { "US-CENTRAL1", true, "null", "storage.us-central1.rep.googleapis.com" }; + yield return new object[] { "US-CENTRAL1", true, "example.com", "example.com" }; + } + + private PutGetStageInfo CreateGCSStageInfo(string region, bool useRegionalUrl, string endPoint) => + new PutGetStageInfo + { + locationType = SFRemoteStorageUtil.GCS_FS, + location = "some location", + path = "some path", + region = region, + storageAccount = "some storage account", + isClientSideEncrypted = true, + stageCredentials = new Dictionary(), + presignedUrl = "some pre-signed url", + endPoint = endPoint, + useRegionalUrl = useRegionalUrl + }; + } +} diff --git a/Snowflake.Data.Tests/UnitTests/SFGCSClientTest.cs b/Snowflake.Data.Tests/UnitTests/SFGCSClientTest.cs index d47742743..599a0b29b 100644 --- a/Snowflake.Data.Tests/UnitTests/SFGCSClientTest.cs +++ b/Snowflake.Data.Tests/UnitTests/SFGCSClientTest.cs @@ -18,7 +18,7 @@ namespace Snowflake.Data.Tests.UnitTests using Snowflake.Data.Tests.Mock; using Moq; - [TestFixture] + [TestFixture, NonParallelizable] class SFGCSClientTest : SFBaseTest { // Mock data for file metadata @@ -340,6 +340,37 @@ public async Task TestDownloadFileAsync(HttpStatusCode? httpStatusCode, ResultSt AssertForDownloadFileTests(expectedResultStatus); } + [Test] + [TestCase("us-central1", null, null, "https://storage.googleapis.com/mock-customer-stage/mock-id/tables/mock-key/")] + [TestCase("us-central1", "example.com", null, "https://example.com/mock-customer-stage/mock-id/tables/mock-key/")] + [TestCase("us-central1", "https://example.com", null, "https://example.com/mock-customer-stage/mock-id/tables/mock-key/")] + [TestCase("us-central1", null, true, "https://storage.us-central1.rep.googleapis.com/mock-customer-stage/mock-id/tables/mock-key/")] + [TestCase("me-central2", null, null, "https://storage.me-central2.rep.googleapis.com/mock-customer-stage/mock-id/tables/mock-key/")] + public void TestUseUriWithRegionsWhenNeeded(string region, string endPoint, bool useRegionalUrl, string expectedRequestUri) + { + var fileMetadata = new SFFileMetadata() + { + stageInfo = new PutGetStageInfo() + { + endPoint = endPoint, + location = Location, + locationType = SFRemoteStorageUtil.GCS_FS, + path = LocationPath, + presignedUrl = null, + region = region, + stageCredentials = _stageCredentials, + storageAccount = null, + useRegionalUrl = useRegionalUrl + } + }; + + // act + var uri = _client.FormBaseRequest(fileMetadata, "PUT").RequestUri.ToString(); + + // assert + Assert.AreEqual(expectedRequestUri, uri); + } + private void AssertForDownloadFileTests(ResultStatus expectedResultStatus) { if (expectedResultStatus == ResultStatus.DOWNLOADED) diff --git a/Snowflake.Data/Core/FileTransfer/StorageClient/SFGCSClient.cs b/Snowflake.Data/Core/FileTransfer/StorageClient/SFGCSClient.cs index f56baf2fa..b51afed36 100644 --- a/Snowflake.Data/Core/FileTransfer/StorageClient/SFGCSClient.cs +++ b/Snowflake.Data/Core/FileTransfer/StorageClient/SFGCSClient.cs @@ -10,6 +10,8 @@ using Newtonsoft.Json; using Snowflake.Data.Log; using System.Net; +using Google.Apis.Storage.v1; +using Google.Cloud.Storage.V1; namespace Snowflake.Data.Core.FileTransfer.StorageClient { @@ -52,6 +54,8 @@ class SFGCSClient : ISFRemoteStorageClient /// private WebRequest _customWebRequest = null; + private static readonly string[] s_scopes = new[] { StorageService.Scope.DevstorageFullControl }; + /// /// GCS client with access token. /// @@ -65,15 +69,32 @@ public SFGCSClient(PutGetStageInfo stageInfo) Logger.Debug("Constructing client using access token"); AccessToken = accessToken; GoogleCredential creds = GoogleCredential.FromAccessToken(accessToken, null); - StorageClient = Google.Cloud.Storage.V1.StorageClient.Create(creds); + var storageClientBuilder = new StorageClientBuilder + { + Credential = creds?.CreateScoped(s_scopes), + EncryptionKey = null + }; + StorageClient = BuildStorageClient(storageClientBuilder, stageInfo); } else { Logger.Info("No access token received from GS, constructing anonymous client with no encryption support"); - StorageClient = Google.Cloud.Storage.V1.StorageClient.CreateUnauthenticated(); + var storageClientBuilder = new StorageClientBuilder + { + UnauthenticatedAccess = true + }; + StorageClient = BuildStorageClient(storageClientBuilder, stageInfo); } } + private Google.Cloud.Storage.V1.StorageClient BuildStorageClient(StorageClientBuilder builder, PutGetStageInfo stageInfo) + { + var gcmCustomEndpoint = stageInfo.GcsCustomEndpoint(); + if (!string.IsNullOrEmpty(gcmCustomEndpoint)) + builder.BaseUri = gcmCustomEndpoint; + return builder.Build(); + } + internal void SetCustomWebRequest(WebRequest mockWebRequest) { _customWebRequest = mockWebRequest; @@ -112,7 +133,7 @@ public RemoteLocation ExtractBucketNameAndPath(string stageLocation) internal WebRequest FormBaseRequest(SFFileMetadata fileMetadata, string method) { string url = string.IsNullOrEmpty(fileMetadata.presignedUrl) ? - generateFileURL(fileMetadata.stageInfo.location, fileMetadata.RemoteFileName()) : + generateFileURL(fileMetadata.stageInfo, fileMetadata.RemoteFileName()) : fileMetadata.presignedUrl; WebRequest request = WebRequest.Create(url); @@ -219,19 +240,26 @@ public async Task GetFileHeaderAsync(SFFileMetadata fileMetadata, Ca return null; } - /// - /// Generate the file URL. - /// - /// The GCS file metadata. - /// The GCS file metadata. - internal string generateFileURL(string stageLocation, string fileName) + internal string generateFileURL(PutGetStageInfo stageInfo, string fileName) { - var gcsLocation = ExtractBucketNameAndPath(stageLocation); + var storageHostPath = ExtractStorageHostPath(stageInfo); + var gcsLocation = ExtractBucketNameAndPath(stageInfo.location); var fullFilePath = gcsLocation.key + fileName; - var link = "https://storage.googleapis.com/" + gcsLocation.bucket + "/" + fullFilePath; + var link = storageHostPath + gcsLocation.bucket + "/" + fullFilePath; return link; } + private string ExtractStorageHostPath(PutGetStageInfo stageInfo) + { + var gcsEndpoint = stageInfo.GcsCustomEndpoint(); + var storageHostPath = string.IsNullOrEmpty(gcsEndpoint) ? "https://storage.googleapis.com/" : gcsEndpoint; + if (!storageHostPath.StartsWith("https://", StringComparison.OrdinalIgnoreCase)) + storageHostPath = "https://" + storageHostPath; + if (!storageHostPath.EndsWith("/")) + storageHostPath = storageHostPath + "/"; + return storageHostPath; + } + /// /// Upload the file to the GCS location. /// diff --git a/Snowflake.Data/Core/RestResponse.cs b/Snowflake.Data/Core/RestResponse.cs index 64275fa42..b490ddcdc 100755 --- a/Snowflake.Data/Core/RestResponse.cs +++ b/Snowflake.Data/Core/RestResponse.cs @@ -8,6 +8,7 @@ using Newtonsoft.Json.Converters; using Newtonsoft.Json.Linq; using Snowflake.Data.Client; +using Snowflake.Data.Core.FileTransfer; namespace Snowflake.Data.Core { @@ -439,6 +440,22 @@ internal class PutGetStageInfo [JsonProperty(PropertyName = "endPoint", NullValueHandling = NullValueHandling.Ignore)] internal string endPoint { get; set; } + + [JsonProperty(PropertyName = "useRegionalUrl", NullValueHandling = NullValueHandling.Ignore)] + internal bool useRegionalUrl { get; set; } + + private const string GcsRegionMeCentral2 = "me-central2"; + + internal string GcsCustomEndpoint() + { + if (!(locationType ?? string.Empty).Equals(SFRemoteStorageUtil.GCS_FS, StringComparison.OrdinalIgnoreCase)) + return null; + if (!string.IsNullOrWhiteSpace(endPoint) && endPoint != "null") + return endPoint; + if (GcsRegionMeCentral2.Equals(region, StringComparison.OrdinalIgnoreCase) || useRegionalUrl) + return $"storage.{region.ToLower()}.rep.googleapis.com"; + return null; + } } internal class PutGetEncryptionMaterial From ded25c2c77af1ae5b0568fd1e4b160e6491083d9 Mon Sep 17 00:00:00 2001 From: Krzysztof Nozderko Date: Thu, 28 Nov 2024 14:34:41 +0100 Subject: [PATCH 2/2] fix typos --- .../UnitTests/PutGetStageInfoTest.cs | 12 ++++++++---- Snowflake.Data.Tests/UnitTests/SFGCSClientTest.cs | 2 +- .../Core/FileTransfer/StorageClient/SFGCSClient.cs | 6 +++--- 3 files changed, 12 insertions(+), 8 deletions(-) diff --git a/Snowflake.Data.Tests/UnitTests/PutGetStageInfoTest.cs b/Snowflake.Data.Tests/UnitTests/PutGetStageInfoTest.cs index 85a34b222..074d95be5 100644 --- a/Snowflake.Data.Tests/UnitTests/PutGetStageInfoTest.cs +++ b/Snowflake.Data.Tests/UnitTests/PutGetStageInfoTest.cs @@ -1,3 +1,7 @@ +/* + * Copyright (c) 2024 Snowflake Computing Inc. All rights reserved. + */ + using System.Collections.Generic; using NUnit.Framework; using Snowflake.Data.Core; @@ -10,16 +14,16 @@ public class PutGetStageInfoTest { [Test] [TestCaseSource(nameof(TestCases))] - public void TestGcmRegionalUrl(string region, bool useRegionalUrl, string endPoint, string expectedGcmEndpoint) + public void TestGcsRegionalUrl(string region, bool useRegionalUrl, string endPoint, string expectedGcsEndpoint) { // arrange - var stageInfo = CreateGCSStageInfo(region, useRegionalUrl, endPoint); + var stageInfo = CreateGcsStageInfo(region, useRegionalUrl, endPoint); // act var gcsCustomEndpoint = stageInfo.GcsCustomEndpoint(); // assert - Assert.AreEqual(expectedGcmEndpoint, gcsCustomEndpoint); + Assert.AreEqual(expectedGcsEndpoint, gcsCustomEndpoint); } internal static IEnumerable TestCases() @@ -41,7 +45,7 @@ internal static IEnumerable TestCases() yield return new object[] { "US-CENTRAL1", true, "example.com", "example.com" }; } - private PutGetStageInfo CreateGCSStageInfo(string region, bool useRegionalUrl, string endPoint) => + private PutGetStageInfo CreateGcsStageInfo(string region, bool useRegionalUrl, string endPoint) => new PutGetStageInfo { locationType = SFRemoteStorageUtil.GCS_FS, diff --git a/Snowflake.Data.Tests/UnitTests/SFGCSClientTest.cs b/Snowflake.Data.Tests/UnitTests/SFGCSClientTest.cs index 599a0b29b..9d336125e 100644 --- a/Snowflake.Data.Tests/UnitTests/SFGCSClientTest.cs +++ b/Snowflake.Data.Tests/UnitTests/SFGCSClientTest.cs @@ -1,5 +1,5 @@ /* - * Copyright (c) 2012-2023 Snowflake Computing Inc. All rights reserved. + * Copyright (c) 2012-2024 Snowflake Computing Inc. All rights reserved. */ using System; diff --git a/Snowflake.Data/Core/FileTransfer/StorageClient/SFGCSClient.cs b/Snowflake.Data/Core/FileTransfer/StorageClient/SFGCSClient.cs index b51afed36..e5d0ac139 100644 --- a/Snowflake.Data/Core/FileTransfer/StorageClient/SFGCSClient.cs +++ b/Snowflake.Data/Core/FileTransfer/StorageClient/SFGCSClient.cs @@ -89,9 +89,9 @@ public SFGCSClient(PutGetStageInfo stageInfo) private Google.Cloud.Storage.V1.StorageClient BuildStorageClient(StorageClientBuilder builder, PutGetStageInfo stageInfo) { - var gcmCustomEndpoint = stageInfo.GcsCustomEndpoint(); - if (!string.IsNullOrEmpty(gcmCustomEndpoint)) - builder.BaseUri = gcmCustomEndpoint; + var gcsCustomEndpoint = stageInfo.GcsCustomEndpoint(); + if (!string.IsNullOrEmpty(gcsCustomEndpoint)) + builder.BaseUri = gcsCustomEndpoint; return builder.Build(); }