Add project files.

govert · govert · commit 0f6896d0b6b2 · 2023-12-14T10:40:23.000+02:00
diff --git a/AddIn.cs b/AddIn.cs
@@ -0,0 +1,30 @@
+﻿using ExcelDna.Integration;
+using ExcelDna.IntelliSense;
+using ExcelDna.Registration;
+
+namespace ImportFunctions
+{
+    /// <summary>
+    /// Add-in lifecycle hooks: registers the worksheet functions and manages the IntelliSense server.
+    /// </summary>
+    public class AddIn : IExcelAddIn
+    {
+        /// <summary>
+        /// Collects the Excel functions, runs them through the async registration processing,
+        /// registers the result, and then installs the IntelliSense server.
+        /// </summary>
+        public void AutoOpen()
+        {
+            var discovered = ExcelRegistration.GetExcelFunctions();
+            var asyncProcessed = discovered.ProcessAsyncRegistrations();
+            asyncProcessed.RegisterFunctions();
+
+            IntelliSenseServer.Install();
+        }
+
+        /// <summary>
+        /// Uninstalls the IntelliSense server.
+        /// </summary>
+        public void AutoClose() => IntelliSenseServer.Uninstall();
+    }
+}
diff --git a/Functions.cs b/Functions.cs
@@ -0,0 +1,226 @@
+﻿using System;
+using System.Net;
+using System.Net.Http;
+using System.Text;
+using System.Threading.Tasks;
+using System.Xml;
+using ExcelDna.Integration;
+using ExcelDna.Registration;
+using HtmlAgilityPack;
+
+namespace ImportFunctions
+{
+    /// <summary>
+    /// Excel worksheet functions that download a page and extract content from it.
+    /// Problems are reported to the caller as strings that start with "Error:".
+    /// </summary>
+    public static class Functions
+    {
+        // We will be using the single HttpClient from multiple threads,
+        // which is OK as long as we're not changing the default request headers.
+        static readonly HttpClient _httpClient;
+
+        // Rows placed directly under a table, or under its thead/tbody/tfoot sections.
+        // Deliberately not ".//tr", which would also pick up rows of nested tables.
+        const string TableRowsXPath = "tr|thead/tr|tbody/tr|tfoot/tr";
+
+        static Functions()
+        {
+            _httpClient = new HttpClient();
+
+            const SecurityProtocolType baseline =
+                SecurityProtocolType.Tls |
+                SecurityProtocolType.Tls11 |
+                SecurityProtocolType.Tls12;
+
+            // An exception escaping a static constructor would make every function in this
+            // class unusable, so fall back to the baseline set if TLS 1.3 is rejected.
+            try
+            {
+                ServicePointManager.SecurityProtocol = baseline | SecurityProtocolType.Tls13;
+            }
+            catch (NotSupportedException)
+            {
+                ServicePointManager.SecurityProtocol = baseline;
+            }
+        }
+
+        /// <summary>
+        /// Downloads <paramref name="url"/> and returns the text of the first node matching
+        /// <paramref name="xpathQuery"/>.
+        /// </summary>
+        /// <param name="url">Address of the page to download.</param>
+        /// <param name="xpathQuery">XPath expression evaluated against the parsed page.</param>
+        /// <returns>The entity-decoded inner text of the first match, or an "Error: ..." string.</returns>
+        [ExcelAsyncFunction(Description = "Imports data from a given URL using an XPath query")]
+        public static async Task<object> ImportXml(string url, string xpathQuery)
+        {
+            if (string.IsNullOrWhiteSpace(url))
+            {
+                return "Error: URL is required";
+            }
+
+            if (string.IsNullOrWhiteSpace(xpathQuery))
+            {
+                return "Error: XPath query is required";
+            }
+
+            try
+            {
+                var doc = await LoadDocumentAsync(url);
+                var node = doc.DocumentNode.SelectSingleNode(xpathQuery);
+                if (node == null)
+                {
+                    return "Error: No data found for the given XPath query";
+                }
+
+                return HtmlEntity.DeEntitize(node.InnerText);
+            }
+            catch (Exception ex)
+            {
+                return DescribeFailure(ex);
+            }
+        }
+
+        /// <summary>
+        /// Downloads <paramref name="url"/> and returns the text of one table or list on the page.
+        /// </summary>
+        /// <returns>
+        /// For a table: one line per row with a tab after every cell. For a list: one line per item.
+        /// Otherwise an "Error: ..." string.
+        /// </returns>
+        [ExcelAsyncFunction(Description = "Imports data from a table or list within an HTML page")]
+        public static async Task<object> ImportHtml(
+            [ExcelArgument(Description = "URL of the HTML page to scrape data from. The URL must start with either http or https.")]
+            string url,
+            [ExcelArgument(Description = "Type of data to import. Accepts either 'table' for HTML tables or 'list' for HTML lists (ul/ol).")]
+            string dataType,
+            [ExcelArgument(Description = "Zero-based index of the table or list to import from the HTML page. For example, 0 for the first table/list, 1 for the second, and so on.")]
+            int index)
+        {
+            if (string.IsNullOrWhiteSpace(url))
+            {
+                return "Error: URL is required";
+            }
+
+            // Accept "Table", " list " and similar; a null dataType matches neither.
+            var kind = dataType?.Trim();
+            var wantsTable = string.Equals(kind, "table", StringComparison.OrdinalIgnoreCase);
+            var wantsList = string.Equals(kind, "list", StringComparison.OrdinalIgnoreCase);
+            if (!wantsTable && !wantsList)
+            {
+                return "Error: Data type must be 'table' or 'list'";
+            }
+
+            try
+            {
+                var doc = await LoadDocumentAsync(url);
+                return wantsTable ? ExtractTable(doc, index) : ExtractList(doc, index);
+            }
+            catch (Exception ex)
+            {
+                return DescribeFailure(ex);
+            }
+        }
+
+        // Fetches the page body as a string and parses it with HtmlAgilityPack.
+        static async Task<HtmlDocument> LoadDocumentAsync(string url)
+        {
+            var html = await _httpClient.GetStringAsync(url);
+            var doc = new HtmlDocument();
+            doc.LoadHtml(html);
+            return doc;
+        }
+
+        // Maps an exception raised while fetching or querying a page to the message shown in the cell.
+        static string DescribeFailure(Exception ex)
+        {
+            if (ex is HttpRequestException)
+            {
+                return $"Error: Unable to fetch data from the URL - {ex.Message}";
+            }
+
+            if (ex is TaskCanceledException)
+            {
+                return "Error: The request timed out or was canceled";
+            }
+
+            if (ex is System.Xml.XPath.XPathException)
+            {
+                return $"Error: Invalid XPath query - {ex.Message}";
+            }
+
+            if (ex is XmlException)
+            {
+                return $"Error: Invalid XML data - {ex.Message}";
+            }
+
+            return $"Error: {ex.Message}";
+        }
+
+        // Inner text of a node with HTML entities decoded and surrounding whitespace removed.
+        static string CleanText(HtmlNode node)
+        {
+            return HtmlEntity.DeEntitize(node.InnerText).Trim();
+        }
+
+        // Renders the table at the given zero-based index as tab-separated lines.
+        static object ExtractTable(HtmlDocument doc, int index)
+        {
+            var tables = doc.DocumentNode.SelectNodes("//table");
+            if (tables == null || index < 0 || index >= tables.Count)
+            {
+                return "Error: Table not found";
+            }
+
+            // SelectNodes yields null rather than an empty collection when nothing matches.
+            var rows = tables[index].SelectNodes(TableRowsXPath);
+            if (rows == null)
+            {
+                return "Error: Table has no rows";
+            }
+
+            var sb = new StringBuilder();
+            foreach (var row in rows)
+            {
+                var cells = row.SelectNodes("th|td");
+                if (cells != null)
+                {
+                    foreach (var cell in cells)
+                    {
+                        sb.Append(CleanText(cell));
+                        sb.Append("\t"); // Tab-separated values
+                    }
+                }
+
+                sb.AppendLine(); // New line at the end of each row, even a row without cells
+            }
+
+            return sb.ToString();
+        }
+
+        // Renders the ul/ol at the given zero-based index as one line per direct li child.
+        static object ExtractList(HtmlDocument doc, int index)
+        {
+            var lists = doc.DocumentNode.SelectNodes("//ul | //ol");
+            if (lists == null || index < 0 || index >= lists.Count)
+            {
+                return "Error: List not found";
+            }
+
+            var items = lists[index].SelectNodes("li");
+            if (items == null)
+            {
+                return "Error: List has no items";
+            }
+
+            var sb = new StringBuilder();
+            foreach (var item in items)
+            {
+                sb.AppendLine(CleanText(item));
+            }
+
+            return sb.ToString();
+        }
+    }
+}
diff --git a/ImportFunctions-Example.xlsx b/ImportFunctions-Example.xlsx
diff --git a/ImportFunctions.csproj b/ImportFunctions.csproj
@@ -0,0 +1,27 @@
+<Project Sdk="Microsoft.NET.Sdk">
+
+  <PropertyGroup>
+    <TargetFramework>net48</TargetFramework>
+
+    <AssemblyTitle>Excel-DNA ImportFunctions Add-In</AssemblyTitle>
+    <Product>ExcelDna.ImportFunctions</Product>
+
+    <ExcelAddInExplicitRegistration>true</ExcelAddInExplicitRegistration>
+
+    <ExcelDnaPackXllSuffix></ExcelDnaPackXllSuffix>
+    <ExcelDnaPack32BitXllName>ExcelDna.ImportFunctions32</ExcelDnaPack32BitXllName>
+    <ExcelDnaPack64BitXllName>ExcelDna.ImportFunctions64</ExcelDnaPack64BitXllName>
+  </PropertyGroup>
+
+  <ItemGroup>
+    <PackageReference Include="ExcelDna.AddIn" Version="1.7.0" />
+    <PackageReference Include="ExcelDna.IntelliSense" Version="1.7.0" />
+    <PackageReference Include="ExcelDna.Registration" Version="1.7.0" />
+    <PackageReference Include="HtmlAgilityPack" Version="1.11.55" />
+  </ItemGroup>
+
+  <ItemGroup>
+    <Reference Include="System.Net.Http" />
+  </ItemGroup>
+  
+</Project>
diff --git a/ImportFunctions.sln b/ImportFunctions.sln
@@ -0,0 +1,25 @@
+﻿
+Microsoft Visual Studio Solution File, Format Version 12.00
+# Visual Studio Version 17
+VisualStudioVersion = 17.8.34316.72
+MinimumVisualStudioVersion = 10.0.40219.1
+Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "ImportFunctions", "ImportFunctions.csproj", "{72EA066C-B79A-48CC-B418-696C790298D5}"
+EndProject
+Global
+	GlobalSection(SolutionConfigurationPlatforms) = preSolution
+		Debug|Any CPU = Debug|Any CPU
+		Release|Any CPU = Release|Any CPU
+	EndGlobalSection
+	GlobalSection(ProjectConfigurationPlatforms) = postSolution
+		{72EA066C-B79A-48CC-B418-696C790298D5}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
+		{72EA066C-B79A-48CC-B418-696C790298D5}.Debug|Any CPU.Build.0 = Debug|Any CPU
+		{72EA066C-B79A-48CC-B418-696C790298D5}.Release|Any CPU.ActiveCfg = Release|Any CPU
+		{72EA066C-B79A-48CC-B418-696C790298D5}.Release|Any CPU.Build.0 = Release|Any CPU
+	EndGlobalSection
+	GlobalSection(SolutionProperties) = preSolution
+		HideSolutionNode = FALSE
+	EndGlobalSection
+	GlobalSection(ExtensibilityGlobals) = postSolution
+		SolutionGuid = {05982616-29F8-46D5-9E6B-090ACF9CA379}
+	EndGlobalSection
+EndGlobal
diff --git a/Properties/launchSettings.json b/Properties/launchSettings.json
@@ -0,0 +1,9 @@
+{
+  "profiles": {
+    "Excel": {
+      "commandName": "Executable",
+      "executablePath": "C:\\Program Files\\Microsoft Office\\root\\Office16\\EXCEL.EXE",
+      "commandLineArgs": "/x \"ImportFunctions-AddIn64.xll\""
+    }
+  }
+}