FileSystem extension skeleton #787

Merged: 33 commits, merged Jan 21, 2021. The diff below shows changes from 5 commits.

Commits:
7c25fcb - Basic FileSystem implementation (Dec 2, 2020)
cc8237f - Move to extension (Dec 2, 2020)
f4e141b - Todo (Dec 2, 2020)
bcde071 - Tests should run (Dec 2, 2020)
06d8b24 - Don't use interface (Dec 2, 2020)
dfad910 - Update src/csharp/Extensions/Microsoft.Spark.Extensions.FileSystem/Jv… (AFFogarty, Dec 3, 2020)
50bc611 - Remove IsPackable (Dec 3, 2020)
00d68a6 - Fixed: Line length 110 (Dec 3, 2020)
ec52232 - Update src/csharp/Extensions/Microsoft.Spark.Extensions.FileSystem/Fi… (AFFogarty, Dec 3, 2020)
4adbb64 - Update src/csharp/Extensions/Microsoft.Spark.Extensions.FileSystem/Fi… (AFFogarty, Dec 3, 2020)
16abe0a - Separate testing for signature and functionality (Dec 3, 2020)
3310897 - Merge (Dec 3, 2020)
d79e702 - Fixed: Test the type of FileSystem (Dec 3, 2020)
bd8579b - Fixed: Empty line (Dec 3, 2020)
a3bf508 - Rename to Hadoop.FileSystem (Dec 4, 2020)
4fc9718 - Rename references (Dec 4, 2020)
1bacdb2 - Move to correct dir (Dec 4, 2020)
53351a6 - Merge implementation with abstract class (Dec 4, 2020)
ac57039 - Better comment (Dec 4, 2020)
8a85d60 - Fixed: Line length (Dec 7, 2020)
9936e9f - Merge new files into existing project (Dec 11, 2020)
c896d63 - Fix references (Dec 11, 2020)
e1f33e8 - Fixed: return message (Dec 11, 2020)
a856829 - Merge branch 'master' of https://github.com/dotnet/spark into anfog/1… (Jan 5, 2021)
6433b3c - Update src/csharp/Microsoft.Spark/Hadoop/FS/FileSystem.cs (AFFogarty, Jan 5, 2021)
4b906e0 - Merge branch 'anfog/1201_filesystem' of https://github.com/AFFogarty/… (Jan 5, 2021)
dcf07d5 - Compiles (Jan 5, 2021)
e41e1ef - Casing fix -- part 1 (Jan 5, 2021)
f798618 - Casing fix -- part 2 (Jan 5, 2021)
8cc2378 - Don't need to test assignable (Jan 5, 2021)
74ce69d - Formatting (Jan 5, 2021)
257ce6c - Fixed: Don't commi test app (Jan 5, 2021)
9f92c7d - Merge branch 'master' of https://github.com/dotnet/spark into anfog/1… (Jan 21, 2021)
@@ -0,0 +1,14 @@
// Licensed to the .NET Foundation under one or more agreements.
// The .NET Foundation licenses this file to you under the MIT license.
// See the LICENSE file in the project root for more information.

namespace Microsoft.Spark.Extensions.FileSystem.E2ETest
{
/// <summary>
/// Constants related to the FileSystem test suite.
/// </summary>
internal class Constants
Collaborator:

Is this file needed? What else are we expecting to be added here?

Contributor Author:

This is the pattern we're using in all the test projects.

{
public const string FileSystemTestContainerName = "FileSystem Tests";
}
}
@@ -0,0 +1,17 @@
// Licensed to the .NET Foundation under one or more agreements.
// The .NET Foundation licenses this file to you under the MIT license.
// See the LICENSE file in the project root for more information.

using Microsoft.Spark.E2ETest;
using Xunit;

namespace Microsoft.Spark.Extensions.FileSystem.E2ETest
{
[CollectionDefinition(Constants.FileSystemTestContainerName)]
public class FileSystemTestCollection : ICollectionFixture<SparkFixture>
{
// This class has no code, and is never created. Its purpose is simply
// to be the place to apply [CollectionDefinition] and all the
// ICollectionFixture<> interfaces.
}
}
@@ -0,0 +1,39 @@
// Licensed to the .NET Foundation under one or more agreements.
// The .NET Foundation licenses this file to you under the MIT license.
// See the LICENSE file in the project root for more information.

using System.IO;
using Microsoft.Spark.E2ETest;
using Microsoft.Spark.Sql;
using Microsoft.Spark.UnitTest.TestUtils;
using Xunit;

namespace Microsoft.Spark.Extensions.FileSystem.E2ETest
{
[Collection(Constants.FileSystemTestContainerName)]
public class FileSystemTests
{
private readonly SparkSession _spark;

public FileSystemTests(SparkFixture fixture)
{
_spark = fixture.Spark;
}

/// <summary>
/// Test that methods return the expected signature.
/// </summary>
[Fact]
public void TestSignatures()
{
using FileSystem fs = FileSystem.Get(_spark.SparkContext);

using var tempDirectory = new TemporaryDirectory();
string path = Path.Combine(tempDirectory.Path, "temp-table");
_spark.Range(25).Write().Format("parquet").Save(path);

Assert.True(fs.Delete(path, true));
Assert.False(fs.Delete(path, true));
}
}
Collaborator:

Can we add another test that validates the Delete API by checking if the file got deleted from the file system?

Contributor Author:

Changed TestSignatures() to only test the signatures, and moved the functional testing into a new test that validates that the file is properly deleted.

}
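
For reference, a functional delete test along the lines discussed above might look like the sketch below, added to the FileSystemTests class shown in this diff. It assumes the E2E suite writes to a local temporary directory (as TestSignatures does), so System.IO can observe the deletion; the test name and exact assertions are illustrative, not necessarily the code merged later in this PR.

[Fact]
public void TestDelete()
{
    using FileSystem fs = FileSystem.Get(_spark.SparkContext);

    using var tempDirectory = new TemporaryDirectory();
    string path = Path.Combine(tempDirectory.Path, "temp-table");
    _spark.Range(25).Write().Format("parquet").Save(path);

    // The parquet output exists on disk before the delete call.
    Assert.True(Directory.Exists(path));

    // Delete reports success, and the directory is gone afterwards.
    Assert.True(fs.Delete(path, recursive: true));
    Assert.False(Directory.Exists(path));
}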
@@ -0,0 +1,13 @@
<Project Sdk="Microsoft.NET.Sdk">

<PropertyGroup>
<TargetFramework>netcoreapp3.1</TargetFramework>
<IsPackable>false</IsPackable>
Collaborator:

Why are we setting this to false?

Contributor Author:

Hmmm, I just copied this from the other extension E2ETest projects. I will remove it everywhere.

</PropertyGroup>

<ItemGroup>
<ProjectReference Include="..\..\Microsoft.Spark.E2ETest\Microsoft.Spark.E2ETest.csproj" />
<ProjectReference Include="..\..\Microsoft.Spark\Microsoft.Spark.csproj" />
<ProjectReference Include="..\Microsoft.Spark.Extensions.FileSystem\Microsoft.Spark.Extensions.FileSystem.csproj" />
</ItemGroup>
</Project>
@@ -0,0 +1,51 @@
// Licensed to the .NET Foundation under one or more agreements.
// The .NET Foundation licenses this file to you under the MIT license.
// See the LICENSE file in the project root for more information.

using System;
using Microsoft.Spark.Interop;
using Microsoft.Spark.Interop.Ipc;

namespace Microsoft.Spark.Extensions.FileSystem
{
/// <summary>
/// An abstract base class for a fairly generic filesystem. It may be implemented as a distributed filesystem, or
/// as a "local" one that reflects the locally-connected disk. The local version exists for small Hadoop instances
/// and for testing.
///
/// All user code that may potentially use the Hadoop Distributed File System should be written to use a FileSystem
/// object. The Hadoop DFS is a multi-machine system that appears as a single disk. It's useful because of its fault
/// tolerance and potentially very large capacity.
/// </summary>
Collaborator:

Please reformat to keep each line within the 110 character limit

Contributor Author:

Oops, I thought we increased it to 120 for some reason. Fixed.

public abstract class FileSystem : IDisposable
{
/// <summary>
/// Returns the configured FileSystem implementation.
/// </summary>
/// <param name="sparkContext">The SparkContext whose configuration will be used.</param>
/// <returns>The FileSystem.</returns>
public static FileSystem Get(SparkContext sparkContext)
Contributor:

This is weird. Is this like a factory? How can I create a new type of FileSystem?

Why not just expose the Hadoop FileSystem directly?

Contributor Author (AFFogarty, Dec 3, 2020):

This is the pattern from the Hadoop FileSystem class: https://hadoop.apache.org/docs/current/api/org/apache/hadoop/fs/FileSystem.html#get-org.apache.hadoop.conf.Configuration-

FileSystem is an abstract class with static get() factory methods that return concrete implementations based on the configuration parameters.

For my .NET implementation, I've added an override of Get() that takes SparkContext so that we don't have to expose SparkContext.hadoopConfiguration.

If we expose the class Configuration in the future, we can expose SparkContext.hadoopConfiguration and add an override FileSystem Get(Configuration conf).

Contributor:

If you are mimicking the hadoop FileSystem, shall we follow the same signature (expose minimal Configuration)? Also, we should add Hadoop to the namespace? (and let's add the link to the comment as well)

Contributor Author:

Added Hadoop to the namespace.

For this PR, I just wanted to provide an MVP skeleton so that it would be easy for community members to contribute APIs in additional PRs. I'm thinking that we can invite others to contribute Configuration if they want to. Thoughts?

Contributor:

Looks like we cannot define Configuration class in the extension package, since SparkContext.hadoopConfiguration will be inside Microsoft.Spark..

What if we add Hadoop directory under https://github.com/dotnet/spark/tree/master/src/csharp/Microsoft.Spark and add FileSystem.cs and Configuration.cs? Note that we don't have to expose any of the APIs for Configuration. I just want to be able to create FileSystem by FileSystem.Get(sparkContext.HadoopConfiguration). Since we are at 1.0, we want to avoid breaking public APIs if possible.

Contributor Author:

Thoughts @rapoth? I know you wanted to put FileSystem in an extension.

Contributor Author:

Synced with @rapoth. We will go with @imback82 's approach.

{
// TODO: Expose hadoopConfiguration as a .NET class and add an override for Get() that takes it.
JvmObjectReference hadoopConfiguration = (JvmObjectReference)
((IJvmObjectReferenceProvider)sparkContext).Reference.Invoke("hadoopConfiguration");

return new JvmReferenceFileSystem(
Collaborator:

Why do we need JvmReferenceFileSystem to encapsulate the JVM object, why can't we do that within FileSystem itself?

Contributor Author:

In the JVM implementation, FileSystem is an abstract class. I wanted to keep that same pattern here.

(JvmObjectReference)SparkEnvironment.JvmBridge.CallStaticJavaMethod(
"org.apache.hadoop.fs.FileSystem",
"get",
hadoopConfiguration));
}

/// <summary>
/// Delete a file.
/// </summary>
/// <param name="path">The path to delete.</param>
/// <param name="recursive">If path is a directory and set to true, the directory is deleted else throws an
Collaborator:

Exceeding 110 character limit.

Contributor Author:

Fixed.

/// exception. In case of a file the recursive can be set to either true or false.</param>
/// <returns>True if delete is successful else false.</returns>
public abstract bool Delete(string path, bool recursive = true);

public abstract void Dispose();
}
}
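
The thread above on Get(SparkContext) resolved to moving FileSystem into Microsoft.Spark (under a Hadoop directory, alongside a thin Configuration wrapper) so the factory can mirror Hadoop's FileSystem.get(Configuration). The sketch below illustrates that direction; the Configuration class, its namespace, and the SparkContext.HadoopConfiguration property are assumptions drawn from the discussion, not code present in this diff.

// Hypothetical sketch only: the shape discussed in the review thread, not the code in this diff.
using Microsoft.Spark.Interop.Ipc;

namespace Microsoft.Spark.Hadoop.Conf
{
    /// <summary>
    /// Thin wrapper around org.apache.hadoop.conf.Configuration. No members are exposed yet;
    /// it exists only so that FileSystem.Get can accept a Configuration, mirroring the Hadoop API.
    /// </summary>
    public sealed class Configuration : IJvmObjectReferenceProvider
    {
        private readonly JvmObjectReference _jvmObject;

        internal Configuration(JvmObjectReference jvmObject) => _jvmObject = jvmObject;

        JvmObjectReference IJvmObjectReferenceProvider.Reference => _jvmObject;
    }
}

// Intended usage, mirroring org.apache.hadoop.fs.FileSystem.get(Configuration):
//     using FileSystem fs = FileSystem.Get(sparkContext.HadoopConfiguration);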
@@ -0,0 +1,44 @@
// Licensed to the .NET Foundation under one or more agreements.
// The .NET Foundation licenses this file to you under the MIT license.
// See the LICENSE file in the project root for more information.

using Microsoft.Spark.Interop;
using Microsoft.Spark.Interop.Ipc;

namespace Microsoft.Spark.Extensions.FileSystem
{
/// <summary>
/// <see cref="FileSystem"/> implementation that wraps a corresponding FileSystem object in the JVM.
/// </summary>
public class JvmReferenceFileSystem : FileSystem, IJvmObjectReferenceProvider
Contributor:

Why is JvmReference public?

Contributor:

I am thinking that we should just put APIs into FileSystem since get handles the getting the right concrete class. In what scenarios, do you see we need a concrete implementation of FileSystem other than hadoop filesystem?

Contributor:

And just name the package as Microsoft.Spark.Extensions.Hadoop.FileSystem so that there is no confusion; i.e., we are just wrapping org.apache.hadoop.fs.FileSystem more or less.

Contributor Author:

Sure, I'll just make FileSystem concrete. I was just trying to keep it as similar to the JVM implementation as possible. But I suppose we won't have any POCO FileSystem implementations.

Contributor Author:

Made FileSystem concrete and removed JvmReferenceFileSystem.

Contributor Author:

Changed implementation to use Configuration.

{
private readonly JvmObjectReference _jvmObject;

internal JvmReferenceFileSystem(JvmObjectReference jvmObject)
{
_jvmObject = jvmObject;
}

JvmObjectReference IJvmObjectReferenceProvider.Reference => _jvmObject;

/// <summary>
/// Delete a file.
/// </summary>
/// <param name="path">The path to delete.</param>
/// <param name="recursive">If path is a directory and set to true, the directory is deleted else throws an
Collaborator:

Exceeding 110 character limit

/// exception. In case of a file the recursive can be set to either true or false.</param>
/// <returns>True if delete is successful else false.</returns>
public override bool Delete(string path, bool recursive = true)
{
JvmObjectReference pathObject =
SparkEnvironment.JvmBridge.CallConstructor("org.apache.hadoop.fs.Path", path);

return (bool)_jvmObject.Invoke("delete", pathObject, recursive);
}

public override void Dispose()
{
_jvmObject.Invoke("close");
}
}
}
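
The threads above resolved to making FileSystem concrete and removing JvmReferenceFileSystem. The sketch below shows what that fold-in might look like, reusing the method bodies from this diff; the Get(Configuration) overload assumes the Configuration wrapper sketched earlier, and the namespaces and details of the merged code may differ.

// Illustrative sketch: FileSystem made concrete, absorbing JvmReferenceFileSystem's members.
using System;
using Microsoft.Spark.Interop;
using Microsoft.Spark.Interop.Ipc;

public class FileSystem : IDisposable, IJvmObjectReferenceProvider
{
    private readonly JvmObjectReference _jvmObject;

    internal FileSystem(JvmObjectReference jvmObject) => _jvmObject = jvmObject;

    JvmObjectReference IJvmObjectReferenceProvider.Reference => _jvmObject;

    /// <summary>Returns the configured FileSystem implementation.</summary>
    public static FileSystem Get(Configuration conf) =>
        new FileSystem(
            (JvmObjectReference)SparkEnvironment.JvmBridge.CallStaticJavaMethod(
                "org.apache.hadoop.fs.FileSystem",
                "get",
                ((IJvmObjectReferenceProvider)conf).Reference));

    /// <summary>Deletes a file or directory, recursively if requested.</summary>
    public bool Delete(string path, bool recursive = true)
    {
        JvmObjectReference pathObject =
            SparkEnvironment.JvmBridge.CallConstructor("org.apache.hadoop.fs.Path", path);

        return (bool)_jvmObject.Invoke("delete", pathObject, recursive);
    }

    public void Dispose() => _jvmObject.Invoke("close");
}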
@@ -0,0 +1,11 @@
<Project Sdk="Microsoft.NET.Sdk">

<PropertyGroup>
<TargetFramework>netstandard2.0</TargetFramework>
</PropertyGroup>

<ItemGroup>
<ProjectReference Include="..\..\Microsoft.Spark\Microsoft.Spark.csproj" />
</ItemGroup>

</Project>
@@ -12,10 +12,12 @@

<ItemGroup>
<InternalsVisibleTo Include="Microsoft.Spark.Extensions.Delta.E2ETest" />
<InternalsVisibleTo Include="Microsoft.Spark.Extensions.FileSystem.E2ETest" />
<InternalsVisibleTo Include="Microsoft.Spark.Extensions.Hyperspace.E2ETest" />
</ItemGroup>

<ItemGroup>
<ProjectReference Include="..\Extensions\Microsoft.Spark.Extensions.FileSystem\Microsoft.Spark.Extensions.FileSystem.csproj" />
<ProjectReference Include="..\Microsoft.Spark.E2ETest.ExternalLibrary\Microsoft.Spark.E2ETest.ExternalLibrary.csproj" />
<ProjectReference Include="..\Microsoft.Spark.Worker\Microsoft.Spark.Worker.csproj" />
<ProjectReference Include="..\Microsoft.Spark\Microsoft.Spark.csproj" />
14 changes: 14 additions & 0 deletions src/csharp/Microsoft.Spark.sln
@@ -39,6 +39,10 @@ Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Microsoft.Spark.Extensions.
EndProject
Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Microsoft.Spark.Extensions.Hyperspace.E2ETest", "Extensions\Microsoft.Spark.Extensions.Hyperspace.E2ETest\Microsoft.Spark.Extensions.Hyperspace.E2ETest.csproj", "{C6019E44-C777-4DE2-B70E-EA025B7D044D}"
EndProject
Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "Microsoft.Spark.Extensions.FileSystem", "Extensions\Microsoft.Spark.Extensions.FileSystem\Microsoft.Spark.Extensions.FileSystem.csproj", "{30FC2E08-5944-47B1-9441-90D6D5D91896}"
EndProject
Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Microsoft.Spark.Extensions.FileSystem.E2ETest", "Extensions\Microsoft.Spark.Extensions.FileSystem.E2ETest\Microsoft.Spark.Extensions.FileSystem.E2ETest.csproj", "{33DF254A-C238-40D8-9A15-B0CCC4A2CE95}"
EndProject
Global
GlobalSection(SolutionConfigurationPlatforms) = preSolution
Debug|Any CPU = Debug|Any CPU
@@ -101,6 +105,14 @@ Global
{C6019E44-C777-4DE2-B70E-EA025B7D044D}.Debug|Any CPU.Build.0 = Debug|Any CPU
{C6019E44-C777-4DE2-B70E-EA025B7D044D}.Release|Any CPU.ActiveCfg = Release|Any CPU
{C6019E44-C777-4DE2-B70E-EA025B7D044D}.Release|Any CPU.Build.0 = Release|Any CPU
{30FC2E08-5944-47B1-9441-90D6D5D91896}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
{30FC2E08-5944-47B1-9441-90D6D5D91896}.Debug|Any CPU.Build.0 = Debug|Any CPU
{30FC2E08-5944-47B1-9441-90D6D5D91896}.Release|Any CPU.ActiveCfg = Release|Any CPU
{30FC2E08-5944-47B1-9441-90D6D5D91896}.Release|Any CPU.Build.0 = Release|Any CPU
{33DF254A-C238-40D8-9A15-B0CCC4A2CE95}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
{33DF254A-C238-40D8-9A15-B0CCC4A2CE95}.Debug|Any CPU.Build.0 = Debug|Any CPU
{33DF254A-C238-40D8-9A15-B0CCC4A2CE95}.Release|Any CPU.ActiveCfg = Release|Any CPU
{33DF254A-C238-40D8-9A15-B0CCC4A2CE95}.Release|Any CPU.Build.0 = Release|Any CPU
EndGlobalSection
GlobalSection(SolutionProperties) = preSolution
HideSolutionNode = FALSE
@@ -114,6 +126,8 @@ Global
{7BDE09ED-04B3-41B2-A466-3D6F7225291E} = {71A19F75-8279-40AB-BEA0-7D4B153FC416}
{70DDA4E9-1195-4A29-9AA1-96A8223A6D4F} = {71A19F75-8279-40AB-BEA0-7D4B153FC416}
{C6019E44-C777-4DE2-B70E-EA025B7D044D} = {71A19F75-8279-40AB-BEA0-7D4B153FC416}
{30FC2E08-5944-47B1-9441-90D6D5D91896} = {71A19F75-8279-40AB-BEA0-7D4B153FC416}
{33DF254A-C238-40D8-9A15-B0CCC4A2CE95} = {71A19F75-8279-40AB-BEA0-7D4B153FC416}
EndGlobalSection
GlobalSection(ExtensibilityGlobals) = postSolution
SolutionGuid = {FD15FFDB-EA1B-436F-841D-3386DDF94538}
2 changes: 2 additions & 0 deletions src/csharp/Microsoft.Spark/Microsoft.Spark.csproj
@@ -18,6 +18,8 @@
<InternalsVisibleTo Include="Microsoft.Spark.Extensions.Delta.E2ETest" />
<InternalsVisibleTo Include="Microsoft.Spark.Extensions.DotNet.Interactive" />
<InternalsVisibleTo Include="Microsoft.Spark.Extensions.DotNet.Interactive.UnitTest" />
<InternalsVisibleTo Include="Microsoft.Spark.Extensions.FileSystem" />
<InternalsVisibleTo Include="Microsoft.Spark.Extensions.FileSystem.E2ETest" />
<InternalsVisibleTo Include="Microsoft.Spark.Extensions.Hyperspace" />
<InternalsVisibleTo Include="Microsoft.Spark.Extensions.Hyperspace.E2ETest" />
<InternalsVisibleTo Include="Microsoft.Spark.UnitTest" />