From ffd97e97cbc9d30fe9159955d04b04c24213ee84 Mon Sep 17 00:00:00 2001
From: Martin Othamar <martin@othamar.net>
Date: Sun, 9 Jul 2023 20:47:59 +0200
Subject: [PATCH] More vectorization of Shishua, .NET 8, use standard
 intrinsics API (#1)

---
 .github/workflows/build.yml                   |    2 +-
 .vscode/settings.json                         |    3 +
 Fast.PRNGs.sln                                |   50 +-
 README.md                                     |    8 +-
 .../Fast.PRNGs.Benchmarks.csproj              |    2 +-
 .../Internals/ToDoubleBenchmarks.cs           |   30 +
 .../Fast.PRNGs.Benchmarks/PRNGsScaling.cs     |   56 +-
 .../SimpleBenchConfig.cs                      |   13 +
 .../Fast.PRNGs.Benchmarks/ThroughputColumn.cs |   41 +
 global.json                                   |    7 +-
 img/perf-scaling-2.png                        |  Bin 0 -> 65195 bytes
 src/External/Directory.Build.props            |    8 -
 .../RawIntrinsics/AVX.ManuallyAdded.cs        |   25 -
 src/External/RawIntrinsics/AVX.cs             | 1336 -------------
 src/External/RawIntrinsics/AVX2.cs            | 1726 -----------------
 src/External/RawIntrinsics/FMA.cs             |  326 ----
 .../RawIntrinsics/MMX.ManuallyAdded.cs        |   11 -
 src/External/RawIntrinsics/MMX.cs             |   65 -
 src/External/RawIntrinsics/Other.cs           |  101 -
 .../RawIntrinsics/RawIntrinsics.csproj        |    8 -
 .../RawIntrinsics/SSE.ManuallyAdded.cs        |   11 -
 src/External/RawIntrinsics/SSE.cs             |  766 --------
 .../RawIntrinsics/SSE2.ManuallyAdded.cs       |   17 -
 src/External/RawIntrinsics/SSE2.cs            | 1714 ----------------
 src/External/RawIntrinsics/SSE3.cs            |  100 -
 src/External/RawIntrinsics/SSE41.cs           |  525 -----
 src/External/RawIntrinsics/SSE42.cs           |   15 -
 src/External/RawIntrinsics/SSSE3.cs           |  148 --
 src/External/RawIntrinsics/Types.cs           |  178 --
 .../RawIntrinsics/Utils.ManuallyAdded.cs      |    7 -
 .../RawIntrinsicsGenerator/Generator.cs       |  556 ------
 .../RawIntrinsicsGenerator/Program.cs         |   16 -
 .../RawIntrinsicsGenerator.csproj             |   16 -
 src/Fast.PRNGs/Common.cs                      |   36 +-
 src/Fast.PRNGs/Fast.PRNGs.csproj              |    6 +-
 src/Fast.PRNGs/MWC256.cs                      |   10 +-
 src/Fast.PRNGs/Shishua.cs                     |  130 +-
 src/Fast.PRNGs/Splitmix64.cs                  |   10 +-
 src/Fast.PRNGs/Xoroshiro128Plus.cs            |   11 +-
 src/Fast.PRNGs/Xoshiro256Plus.cs              |   10 +-
 test/Fast.PRNGs.Tests/Fast.PRNGs.Tests.csproj |    2 +-
 test/Fast.PRNGs.Tests/ShishuaTests.cs         |   21 +-
 42 files changed, 298 insertions(+), 7825 deletions(-)
 create mode 100644 .vscode/settings.json
 create mode 100644 benchmark/Fast.PRNGs.Benchmarks/Internals/ToDoubleBenchmarks.cs
 create mode 100644 benchmark/Fast.PRNGs.Benchmarks/SimpleBenchConfig.cs
 create mode 100644 benchmark/Fast.PRNGs.Benchmarks/ThroughputColumn.cs
 create mode 100644 img/perf-scaling-2.png
 delete mode 100644 src/External/Directory.Build.props
 delete mode 100644 src/External/RawIntrinsics/AVX.ManuallyAdded.cs
 delete mode 100644 src/External/RawIntrinsics/AVX.cs
 delete mode 100644 src/External/RawIntrinsics/AVX2.cs
 delete mode 100644 src/External/RawIntrinsics/FMA.cs
 delete mode 100644 src/External/RawIntrinsics/MMX.ManuallyAdded.cs
 delete mode 100644 src/External/RawIntrinsics/MMX.cs
 delete mode 100644 src/External/RawIntrinsics/Other.cs
 delete mode 100644 src/External/RawIntrinsics/RawIntrinsics.csproj
 delete mode 100644 src/External/RawIntrinsics/SSE.ManuallyAdded.cs
 delete mode 100644 src/External/RawIntrinsics/SSE.cs
 delete mode 100644 src/External/RawIntrinsics/SSE2.ManuallyAdded.cs
 delete mode 100644 src/External/RawIntrinsics/SSE2.cs
 delete mode 100644 src/External/RawIntrinsics/SSE3.cs
 delete mode 100644 src/External/RawIntrinsics/SSE41.cs
 delete mode 100644 src/External/RawIntrinsics/SSE42.cs
 delete mode 100644 src/External/RawIntrinsics/SSSE3.cs
 delete mode 100644 src/External/RawIntrinsics/Types.cs
 delete mode 100644 src/External/RawIntrinsics/Utils.ManuallyAdded.cs
 delete mode 100644 src/External/RawIntrinsicsGenerator/Generator.cs
 delete mode 100644 src/External/RawIntrinsicsGenerator/Program.cs
 delete mode 100644 src/External/RawIntrinsicsGenerator/RawIntrinsicsGenerator.csproj

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index ae0c2b8..ba390cd 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -18,7 +18,7 @@ jobs:
     - name: Setup .NET Core
       uses: actions/setup-dotnet@v1
       with:
-        dotnet-version: '7.0.x'
+        dotnet-version: '8.0.100-preview.5.23303.2'
 
     - name: Install dependencies
       run: dotnet restore
diff --git a/.vscode/settings.json b/.vscode/settings.json
new file mode 100644
index 0000000..2ed6265
--- /dev/null
+++ b/.vscode/settings.json
@@ -0,0 +1,3 @@
+{
+    "dotnet.defaultSolution": "Fast.PRNGs.sln"
+}
diff --git a/Fast.PRNGs.sln b/Fast.PRNGs.sln
index c78b6ae..9077a5f 100644
--- a/Fast.PRNGs.sln
+++ b/Fast.PRNGs.sln
@@ -7,58 +7,30 @@ Project("{2150E333-8FDC-42A3-9474-1A3956D46DE8}") = "src", "src", "{B56AF188-D99
 EndProject
 Project("{2150E333-8FDC-42A3-9474-1A3956D46DE8}") = "test", "test", "{82A9760F-251B-4220-9263-153755FA2EC3}"
 EndProject
-Project("{2150E333-8FDC-42A3-9474-1A3956D46DE8}") = "External", "External", "{12A7C294-6EF5-4FDF-A2BA-A01E320B9C36}"
-	ProjectSection(SolutionItems) = preProject
-		src\External\Directory.Build.props = src\External\Directory.Build.props
-	EndProjectSection
-EndProject
-Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "RawIntrinsics", "src\External\RawIntrinsics\RawIntrinsics.csproj", "{BA5145CD-6180-4BA3-817F-197158280327}"
-EndProject
-Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "RawIntrinsicsGenerator", "src\External\RawIntrinsicsGenerator\RawIntrinsicsGenerator.csproj", "{A161A378-55BF-48D2-84FF-DA3F09EA5258}"
-EndProject
 Project("{2150E333-8FDC-42A3-9474-1A3956D46DE8}") = "_files", "_files", "{3D9E2A5B-D3F0-49AB-BEC3-647C5063537C}"
 	ProjectSection(SolutionItems) = preProject
-		Directory.Build.props = Directory.Build.props
-		global.json = global.json
-		Fast.PRNGs.sln = Fast.PRNGs.sln
 		.editorconfig = .editorconfig
-		.gitignore = .gitignore
 		.gitattributes = .gitattributes
+		.gitignore = .gitignore
+		Directory.Build.props = Directory.Build.props
+		Fast.PRNGs.sln = Fast.PRNGs.sln
+		global.json = global.json
 	EndProjectSection
 EndProject
-Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "Fast.PRNGs", "src\Fast.PRNGs\Fast.PRNGs.csproj", "{AE271FFA-B5D2-40D8-92E4-71D970142F6D}"
+Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Fast.PRNGs", "src\Fast.PRNGs\Fast.PRNGs.csproj", "{AE271FFA-B5D2-40D8-92E4-71D970142F6D}"
 EndProject
-Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "Fast.PRNGs.Tests", "test\Fast.PRNGs.Tests\Fast.PRNGs.Tests.csproj", "{732E59B8-C209-495B-8608-77E746A68F22}"
+Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Fast.PRNGs.Tests", "test\Fast.PRNGs.Tests\Fast.PRNGs.Tests.csproj", "{732E59B8-C209-495B-8608-77E746A68F22}"
 EndProject
 Project("{2150E333-8FDC-42A3-9474-1A3956D46DE8}") = "benchmark", "benchmark", "{089CE6DA-C860-48D3-95D2-353C7A71C9CD}"
 EndProject
-Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "Fast.PRNGs.Benchmarks", "benchmark\Fast.PRNGs.Benchmarks\Fast.PRNGs.Benchmarks.csproj", "{2A875B02-B84C-43A3-BF16-593F5E6276BC}"
+Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Fast.PRNGs.Benchmarks", "benchmark\Fast.PRNGs.Benchmarks\Fast.PRNGs.Benchmarks.csproj", "{2A875B02-B84C-43A3-BF16-593F5E6276BC}"
 EndProject
 Global
 	GlobalSection(SolutionConfigurationPlatforms) = preSolution
 		Debug|Any CPU = Debug|Any CPU
 		Release|Any CPU = Release|Any CPU
 	EndGlobalSection
-	GlobalSection(SolutionProperties) = preSolution
-		HideSolutionNode = FALSE
-	EndGlobalSection
-	GlobalSection(NestedProjects) = preSolution
-		{12A7C294-6EF5-4FDF-A2BA-A01E320B9C36} = {B56AF188-D999-4444-AE68-4971A573FAA4}
-		{BA5145CD-6180-4BA3-817F-197158280327} = {12A7C294-6EF5-4FDF-A2BA-A01E320B9C36}
-		{A161A378-55BF-48D2-84FF-DA3F09EA5258} = {12A7C294-6EF5-4FDF-A2BA-A01E320B9C36}
-		{AE271FFA-B5D2-40D8-92E4-71D970142F6D} = {B56AF188-D999-4444-AE68-4971A573FAA4}
-		{732E59B8-C209-495B-8608-77E746A68F22} = {82A9760F-251B-4220-9263-153755FA2EC3}
-		{2A875B02-B84C-43A3-BF16-593F5E6276BC} = {089CE6DA-C860-48D3-95D2-353C7A71C9CD}
-	EndGlobalSection
 	GlobalSection(ProjectConfigurationPlatforms) = postSolution
-		{BA5145CD-6180-4BA3-817F-197158280327}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
-		{BA5145CD-6180-4BA3-817F-197158280327}.Debug|Any CPU.Build.0 = Debug|Any CPU
-		{BA5145CD-6180-4BA3-817F-197158280327}.Release|Any CPU.ActiveCfg = Release|Any CPU
-		{BA5145CD-6180-4BA3-817F-197158280327}.Release|Any CPU.Build.0 = Release|Any CPU
-		{A161A378-55BF-48D2-84FF-DA3F09EA5258}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
-		{A161A378-55BF-48D2-84FF-DA3F09EA5258}.Debug|Any CPU.Build.0 = Debug|Any CPU
-		{A161A378-55BF-48D2-84FF-DA3F09EA5258}.Release|Any CPU.ActiveCfg = Release|Any CPU
-		{A161A378-55BF-48D2-84FF-DA3F09EA5258}.Release|Any CPU.Build.0 = Release|Any CPU
 		{AE271FFA-B5D2-40D8-92E4-71D970142F6D}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
 		{AE271FFA-B5D2-40D8-92E4-71D970142F6D}.Debug|Any CPU.Build.0 = Debug|Any CPU
 		{AE271FFA-B5D2-40D8-92E4-71D970142F6D}.Release|Any CPU.ActiveCfg = Release|Any CPU
@@ -72,4 +44,12 @@ Global
 		{2A875B02-B84C-43A3-BF16-593F5E6276BC}.Release|Any CPU.ActiveCfg = Release|Any CPU
 		{2A875B02-B84C-43A3-BF16-593F5E6276BC}.Release|Any CPU.Build.0 = Release|Any CPU
 	EndGlobalSection
+	GlobalSection(SolutionProperties) = preSolution
+		HideSolutionNode = FALSE
+	EndGlobalSection
+	GlobalSection(NestedProjects) = preSolution
+		{AE271FFA-B5D2-40D8-92E4-71D970142F6D} = {B56AF188-D999-4444-AE68-4971A573FAA4}
+		{732E59B8-C209-495B-8608-77E746A68F22} = {82A9760F-251B-4220-9263-153755FA2EC3}
+		{2A875B02-B84C-43A3-BF16-593F5E6276BC} = {089CE6DA-C860-48D3-95D2-353C7A71C9CD}
+	EndGlobalSection
 EndGlobal
diff --git a/README.md b/README.md
index 0cab574..638bf73 100644
--- a/README.md
+++ b/README.md
@@ -38,11 +38,5 @@ NOTE - MWC256 is likely poorly implemented (it is supposed to be faster). As see
 This is clear from the generated assembly atm but I'm not sure why those branching instructions are generated. `UInt128` support is pretty new
 so maybe there are some inefficiencies there.
 
-![Scaling iterations](/img/perf-scaling.png "Scaling iterations")
-
-#### With hardware counters
-
-Instrumented with more diagnostics, including hardware counters
-
-![With hardware counters](/img/perf-hardwarecounters.png "With hardware counters")
+![Scaling iterations](/img/perf-scaling-2.png "Scaling iterations")
 
diff --git a/benchmark/Fast.PRNGs.Benchmarks/Fast.PRNGs.Benchmarks.csproj b/benchmark/Fast.PRNGs.Benchmarks/Fast.PRNGs.Benchmarks.csproj
index 03ae3ed..deed779 100644
--- a/benchmark/Fast.PRNGs.Benchmarks/Fast.PRNGs.Benchmarks.csproj
+++ b/benchmark/Fast.PRNGs.Benchmarks/Fast.PRNGs.Benchmarks.csproj
@@ -2,7 +2,7 @@
   <PropertyGroup>
     <OutputType>Exe</OutputType>
     <LangVersion>latest</LangVersion>
-    <TargetFramework>net7.0</TargetFramework>
+    <TargetFramework>net8.0</TargetFramework>
     <Nullable>disable</Nullable>
     <DebugType>pdbonly</DebugType>
     <DebugSymbols>true</DebugSymbols>
diff --git a/benchmark/Fast.PRNGs.Benchmarks/Internals/ToDoubleBenchmarks.cs b/benchmark/Fast.PRNGs.Benchmarks/Internals/ToDoubleBenchmarks.cs
new file mode 100644
index 0000000..fbf1e22
--- /dev/null
+++ b/benchmark/Fast.PRNGs.Benchmarks/Internals/ToDoubleBenchmarks.cs
@@ -0,0 +1,30 @@
+namespace Fast.PRNGs.Benchmarks.Internals;
+
+[ConfigSource] // applies the nested ConfigSourceAttribute declared at the bottom of this class
+public class ToDoublesBenchmark // micro-benchmark comparing two ulong -> double scaling expressions
+{
+    internal const ulong DoubleMask = (1L << 53) - 1; // low 53 bits set
+    internal const double Norm53 = 1.0d / (1L << 53); // 2^-53
+
+    [Params(31512512431231UL)] // single fixed input value
+    public ulong Value { get; set; }
+
+    [Benchmark]
+    public double Original() // keeps the LOW 53 bits of Value, then scales by 2^-53
+    {
+        return (Value & DoubleMask) * Norm53;
+    }
+
+    [Benchmark]
+    public double New() // keeps the HIGH 53 bits of Value (shift right by 11), then scales by 2^-53; not the same number as Original()
+    {
+        return (Value >> 11) * (1.0 / (1ul << 53));
+    }
+
+    private class ConfigSourceAttribute : Attribute, IConfigSource // exposes the config object through IConfigSource.Config
+    {
+        public IConfig Config { get; }
+
+        public ConfigSourceAttribute() => Config = new SimpleBenchConfig(8); // 8 is SimpleBenchConfig's byteSizePerIteration (presumably one double per call - confirm)
+    }
+}
diff --git a/benchmark/Fast.PRNGs.Benchmarks/PRNGsScaling.cs b/benchmark/Fast.PRNGs.Benchmarks/PRNGsScaling.cs
index 1ce48d5..2e2d785 100644
--- a/benchmark/Fast.PRNGs.Benchmarks/PRNGsScaling.cs
+++ b/benchmark/Fast.PRNGs.Benchmarks/PRNGsScaling.cs
@@ -1,22 +1,31 @@
+using BenchmarkDotNet.Environments;
+using System.Runtime.Intrinsics;
+
 namespace Fast.PRNGs.Benchmarks;
 
-[Config(typeof(Config))]
+[ConfigSource]
 public class PRNGsScaling
 {
+    private const int _iterations = 1 << 17;
+    
     private Random _random;
-    private Shishua _shishua;
+    private Shishua _shishuaSeq;
+    private Shishua _shishuaVec256;
+    private Shishua _shishuaVec512;
     private Xoroshiro128Plus _xoroshiro128plus;
     private Xoshiro256Plus _xoshiro256plus;
     private MWC256 _mwc256;
 
-    [Params(100_000, 1_000_000)]
+    [Params(_iterations)]
     public int Iterations { get; set; }
 
     [GlobalSetup]
     public void Setup()
     {
         _random = new Random();
-        _shishua = Shishua.Create();
+        _shishuaSeq = Shishua.Create();
+        _shishuaVec256 = Shishua.Create();
+        _shishuaVec512 = Shishua.Create();
         _xoroshiro128plus = Xoroshiro128Plus.Create();
         _xoshiro256plus = Xoshiro256Plus.Create();
         _mwc256 = MWC256.Create();
@@ -25,7 +34,9 @@ public void Setup()
     [GlobalCleanup]
     public void Cleanup()
     {
-        _shishua.Dispose();
+        _shishuaSeq.Dispose();
+        _shishuaVec256.Dispose();
+        _shishuaVec512.Dispose();
     }
 
     [Benchmark(Baseline = true)]
@@ -38,10 +49,30 @@ public double SystemRandomGen()
     }
 
     [Benchmark]
-    public double ShishuaGen()
+    public double ShishuaSeqGen()
     {
         for (int i = 0; i < Iterations; i++)
-            _ = _shishua.NextDouble();
+            _ = _shishuaSeq.NextDouble();
+
+        return default;
+    }
+
+    [Benchmark]
+    public double ShishuaVec256Gen()
+    {
+        Vector256<double> result = default;
+        for (int i = 0; i < Iterations; i += 4)
+            _shishuaVec256.NextDoubles256(ref result);
+
+        return default;
+    }
+
+    [Benchmark]
+    public double ShishuaVec512Gen()
+    {
+        Vector512<double> result = default;
+        for (int i = 0; i < Iterations; i += 8)
+            _shishuaVec512.NextDoubles512(ref result);
 
         return default;
     }
@@ -73,13 +104,10 @@ public double MWC256Gen()
         return default;
     }
 
-    private sealed class Config : ManualConfig
+    private class ConfigSourceAttribute : Attribute, IConfigSource
     {
-        public Config()
-        {
-            this.SummaryStyle = SummaryStyle.Default.WithRatioStyle(RatioStyle.Trend);
-            this.AddColumn(RankColumn.Arabic);
-            this.Orderer = new DefaultOrderer(SummaryOrderPolicy.SlowestToFastest, MethodOrderPolicy.Declared);
-        }
+        public IConfig Config { get; }
+
+        public ConfigSourceAttribute() => Config = new SimpleBenchConfig(_iterations * sizeof(double));
     }
 }
diff --git a/benchmark/Fast.PRNGs.Benchmarks/SimpleBenchConfig.cs b/benchmark/Fast.PRNGs.Benchmarks/SimpleBenchConfig.cs
new file mode 100644
index 0000000..c996b37
--- /dev/null
+++ b/benchmark/Fast.PRNGs.Benchmarks/SimpleBenchConfig.cs
@@ -0,0 +1,13 @@
+namespace Fast.PRNGs.Benchmarks;
+
+internal sealed class SimpleBenchConfig : ManualConfig // shared benchmark config: trend ratio style, rank column, slowest-to-fastest ordering
+{
+    public SimpleBenchConfig(ulong? byteSizePerIteration = null) // when non-null, a ThroughputColumn built from this byte count is added as well
+    {
+        this.SummaryStyle = SummaryStyle.Default.WithRatioStyle(RatioStyle.Trend);
+        this.AddColumn(RankColumn.Arabic);
+        this.Orderer = new DefaultOrderer(SummaryOrderPolicy.SlowestToFastest, MethodOrderPolicy.Declared);
+        if (byteSizePerIteration != null) // throughput column is opt-in; it is registered after the rank column
+            this.AddColumn(new ThroughputColumn(byteSizePerIteration.Value));
+    }
+}
diff --git a/benchmark/Fast.PRNGs.Benchmarks/ThroughputColumn.cs b/benchmark/Fast.PRNGs.Benchmarks/ThroughputColumn.cs
new file mode 100644
index 0000000..be54912
--- /dev/null
+++ b/benchmark/Fast.PRNGs.Benchmarks/ThroughputColumn.cs
@@ -0,0 +1,41 @@
+using BenchmarkDotNet.Running;
+
+namespace Fast.PRNGs.Benchmarks;
+
+public class ThroughputColumn : IColumn // summary column that reports bytes processed per second as "x.xx GB/s"
+{
+    public string Id { get; } // "<type name>.<column name>"
+
+    public string ColumnName { get; } // always "Throughput"
+
+    private readonly ulong _byteSizePerIteration; // bytes handled by one benchmark invocation, as supplied by the caller
+
+    public ThroughputColumn(ulong byteSizePerIteration)
+    {
+        ColumnName = "Throughput";
+        Id = nameof(ThroughputColumn) + "." + ColumnName; // was nameof(TagColumn): copy-paste leftover that produced a "TagColumn.*" id
+
+        _byteSizePerIteration = byteSizePerIteration;
+    }
+
+    public bool IsDefault(Summary summary, BenchmarkCase benchmarkCase) => false;
+    public string GetValue(Summary summary, BenchmarkCase benchmarkCase) // returns "?" when no usable mean exists
+    {
+        var stats = summary[benchmarkCase].ResultStatistics;
+        if (stats is null || stats.Mean == default || double.IsNaN(stats.Mean)) // also guards the division below against a zero mean
+            return "?";
+
+        var gbs = (_byteSizePerIteration / 1e9d) / (stats.Mean / 1e9d); // bytes -> GB divided by mean -> seconds (mean is treated as nanoseconds)
+        return $"{gbs:0.00} GB/s";
+    }
+
+    public bool IsAvailable(Summary summary) => true;
+    public bool AlwaysShow => true;
+    public ColumnCategory Category => ColumnCategory.Metric;
+    public int PriorityInCategory => 0;
+    public bool IsNumeric => true;
+    public UnitType UnitType => UnitType.Size;
+    public string Legend => "Throughput in GB/s"; // plain literal; the original interpolated string had no placeholders
+    public string GetValue(Summary summary, BenchmarkCase benchmarkCase, SummaryStyle style) => GetValue(summary, benchmarkCase); // style is ignored
+    public override string ToString() => ColumnName;
+}
diff --git a/global.json b/global.json
index 3672f82..717bcdd 100644
--- a/global.json
+++ b/global.json
@@ -1,6 +1,7 @@
 {
   "sdk": {
-    "version": "7.0.201",
-    "rollForward": "latestFeature"
+    "version": "8.0.100-preview.5.23303.2",
+    "rollForward": "latestFeature",
+    "allowPrerelease": true
   }
-}
\ No newline at end of file
+}
diff --git a/img/perf-scaling-2.png b/img/perf-scaling-2.png
new file mode 100644
index 0000000000000000000000000000000000000000..89561cbbaf642ba129775737e12b4a421b850571
GIT binary patch
literal 65195
zcmeFYWmuG58}}=s14^p5Gz^G{bV`Q|N=gVwNDB<z%`hO6N{4i(NOyO~&|O1HGxPuh
z%sbxoJkPhikM}tCr~Lt#xn@{bthLVbT)+Q+eN|SJCU{8k@Xnn(1hO)3RPNll7k1|k
zRtGKsa|HDLeF)|cmZOR^=uYtv)i&nMJyQt<i92`7!tt&R?_=ISu#?epymN=J<M$6%
zkL?fRJ9lnh%f69NbJN>vdJs?5<&M^GD9|;}c?tqOj(ZKFrSq%pgwB5E>ehKNLu}R4
z$=7CY<<)##^Yuo+k9hUuE77We*ebmkCn28%6~JiF@F0nnkenEo`0jJ|3`o`74KfeB
zw79gCny@pQx|pztFirFF$jz&+|G8B2bIGIOXMKKFR#wjgIzM6%?w`LR)9c(w{(g-)
zkO_34`p>69YU=`z|MOvful@6X|B+55a!uy1Hhwph{j4YQpEl|IWZs6+|JOObQAz)&
zm1j={!~WCC8|ME#;ZFxD>Zz(06!MJp!ch>^@n08nmBrjMT9!oQI9{JuYcFaPtTFb0
zfbl;~?S$usg@vWAZqmk!o_-DW-cPmmYD?k2E$Ax1en7ylmRx&jR^vT=m*0DU3Jryh
z1CXx=vJR%LH5xv^N-iz`bA_4VgFIpJZ|}9(Hch6<KccXC>E^wee}J8I+pe%X+r7y5
zOU(7de5j4=fQsvzX{>|m(6qyf%>P`-8*gryfW^eD)Lw<3<JPJ@djEjT(fjD9Bg%Sq
zJPl~&K9T1C@3VRXOrVn9w7u~5%AY3c*4weMYRYnRrp;IZmDV=T-QN7977^D&e&BD;
zYx?97pWx)M$#vkv6<%8sit=dzD{{tGL*3flo8Sp`l@O#ABH}8o+H!$#asG<@ogb>d
z7EzZks`{l}bo4kRslkNQb>SC1qytNlA8gq*Zn@19R3dsMoNcL(_Kq1n&LwTi!XL6l
z=Z3>yZoD1<(H#HhDvgL6)d)5LgxFLR8_66QE6frirHz*i2;(-oFXJ6lELyGZ*uYt*
zTw&KWttOsOKu7z_FmZnI{c#tm&963c!_N_R?GpY*y|@no9ZmBN_Mrl?qmfGqi^5l@
zt3S9?&Apb;x0(adx2RFwKo99LkD9hPev?iwg-#;JdeciD<<uDJ7L7IDepQ-(`^gOd
z3$^rMkdGXM#6N%qCoBbz-*av_B4M;C#kKs}WK;H5c(YJv@=Dqj$|WjbIW&J*BgPIs
zR2wM&wQ(T4=Jjh>K;_nPk7LpLZQ$TUYTqq>#){^cbgh21?#giNlD{rgk)2BHy18=0
z9Zj7_5cd2wu7mH=t8z<o&Qacw-cGaBq*z>oNB*U)`@i!blMB~@ifjH}AYRy4xr$Iw
z`-e{{+6d}r!~7+774@bUmV>>9FNS#D=E;)C42SpV{fe_GYYd(h6wr+?>KH4qn3<`}
zzsUbAXdUGjz!PuS>Ej6KZm_>i23)pA#;m8tqE9ycb@8sr2kk4fH_W|<KuiDAN9zLR
zT5tG6>&AZ%+v3Npi|usngXB~%2Pd$=t2*Nz(P$llPKf(F;%1NP{1Pj6vMbJ)07sxq
ztmcURV62K11&tI~9axk*vN+l8Qo3mqG#Qu-oArzjPxEwWN;I*kiVFO9NbDqi3(LA-
z&D8E$&~6lp7_rOvJ;Bfqq2S5uOzTMa$!5XsFw3own_c>hp2WPf(%I(9DuS;GK1}$@
zeGX0O?IT>V_QWe-*r0U7q9W5l*la-T_QZg%qPR-r-?{YOTg{28%k<I8AIxvfYLzu@
zx(dl574gvG03utVCRayOUoC;^y`7w28rOoM8FtKEl(;lhCz`giq5I}%n-*mo7JEvS
z1F<RBn-;P8<nH~F|Mpa<gjUa}9gOep>gxB4Y7LcZM-t6|0M%eviWXsaz>GlD5d7jn
z%icFF>1xm5npms~Z`=;b8O6B;<Q3|p;Xr>a<2HRtwVL%(tS%%)Z`~j6$|m&1WoN0)
zd$aWsN#HTPUhxT-zgeT=9jsUWzXmN;zff3!W%c{iWmZFR`s9}ahBL%Tr^OZ?lN>l}
zY^DIix^5aVzm>^L^s964Z!J?{X_Ys*(|wXx-De?ZNR#ck`c*GbsXS8g)-@@^ctsF=
zYK182!rZ7pFQDR`!oT;I75#TK^jeNtcHR~E!cOICFB_<ACct${O9@t2*fMw3Cr665
z^i}=arEgv`P)oNy&L>}-*U*XjgF+FXpw~zd$%>4H;nbOnsxC|x@n6;S{U;_HXB4i<
z@V;pLf-Vt)Z^TxzIwPw@o&~1<+u~2q|0DvruIVGZe-lH{=-2<}iQ)hAO!WVsaFp}9
zYcy#wP-&ah>&aQ`Ba~BJT5`+Ke${;J>QlOaR9C9<*<HF#DRB0>Q6*j7D?l20L<+f$
zv}X2t0>X{-4{)KnS%mP_SvFTq>0Z=Oe$&_q_E1VA4!uYCt;K!%1@gd1Xb}=VFzxPF
zrlfn5#!<qe_lS-*S}D1%Pr=O9rp-z)tn<)*uT9tHDu#w%Y^>||spyp`GN3eH9V#5c
zf#&B{X0<C|RQ{q(ccqQ%o<!1y$YW3tv)Rtp))tc&P3yFHT^kIZgElaj{RVcOmo!=^
zDYj+NBNww9Om^x7yQ0_F4z3Z?`nJ@G&BlTy^CRoAtd=g*@W~w;R0~&E!DL&j%{CtF
zpi2XAg}a8l2}D#jbSYI`47=P6h?8ra-3%<&kQfkq9<D2T>%UeixmGPeLDd2#LCN08
z0|gtjXti5H^3mmkF8zmxsC;Q_7aSM|S;*(Yg71{wq`rr|7Da1=B!b($u%?Zg<Ej^F
z;l`pph83L5MB|kG8*Pjq7nDjY2A*32?mU@;$nB6R-IpEU@S2`V0`#MTflFK6;k)+Y
zA9-Cyoaw{9LlcvCQ{+4>`~vX&FPd+V{%vjOC0=EXkO<V{7sFRcrk*6zUXC?xDQr0>
z87ufs2Zt}AF?b^9?}D|R9QEfTUx~GEvcct!-Z%HWy(|?`9^zk^-#McTMPDp<ASaGV
zT({4P^4)tW(hSey4uR-7H*YrEI<1zAdCK{P@RGf8XF#8UwU&Ba7x_D}*7n$ORO0|c
zf_Ijh`v*zAeVz>!yoTorHW3=$<PV34lb@NN-*wN^XCO$st~pOf8Ie+z*-FHL5i|QI
zktD8WwI3s@njg^!f0`m(tlP>Z28F!%;=wNTxxm)anSWt?Cs*OX-rE_J=lU(kv&<oP
zyu&Ux+SFXJ%Aod9k1!F7)7FN-d3wJgsLui3*h<{WnTfBU#I?@3_0wlV8ULI0ooIkB
zGnMaf%fjA9cawq*xK;x@fas_z94D=JST^dO<PLC{J)68E4aMdATx<Apuqr>g9@4S0
zypC=@Eh7+1RZfNGdyey%6nvo%D}Tj#m#bggX~oYAJ7)A<P%6l*mNgwsw!^=ue<cCh
zf}Rw&xObWQ;;(|HM=w8=@Sp88KB5>(*JTtHww~V~m%cbMf-LMfE8HRrk2cug5f?Ie
z?(zHuC8Fuc2~T^`jC8~JQ!epSDMIN36#7(P$Q{KOKfW(8bIn}*gasNJ%5UG;eU}$i
zmT!2@#NS)dg1=Fghj+$Yv^12WRSPu7b^dt7c_i-5GX+#?QNHp9b!;fS@{n6<alO>E
zHRXb6$rt()KTA$0@tO_xS6oSo3)zPr_pstca;Oi9)EVX8H{hLaZ{^$)F+?m<Xrziv
z8oh2G7fZG4Iy;T2F$TIl1_HY3dk<PK*t@)MT?$bpZ;ft5BPmVsT?8Cfmixy;IE9%-
z?Sc3rMIBhL^+rVxkR0L^o8BE<;44$-+p*nwkB&%FF&^xf6J-7blz65*U~3PE=jR}s
zxz``@pQ|ZJc9>vwB)2`_885CC6dhvS9%#7z^%N)sGl*auS0CoMIub~;1(PQliSs7g
z_eaLaN0-QFhaU>OwVpDKy*Q4wHS?^rucQ?4DH7$xS&c*yvTk;qvsVILMUoFrVH9aT
zs($2zz4PljEOj3~aUK!801{^+J3g@Iq*I$ajjaRR&*L&UD+aCVv!gwy&hO*&tquP%
z7a#e$%0o_g0Gr4l7n47OIJuEJB~1xp5gnGpiD1e*<+29HOms>HR(8Fnu?2@I+q>p^
z-V{);3V}<VpY$)E0#g{L-NxP|UJTw`4w>Hev^#_aR@6ozD?MinFU!y@rubSO%+{Gf
zZ6S1brMr@eJ9YDu-OIae$#`06TicCvy4#d{W+fQ4*+uD&VGeM)<-$_5!cM^ViX7MQ
z)tdwTF@D-IESvzRV>C+}`q=Lf4{nWseu)D}$uB7Tk?OPg!E5vFsc7CE1werNJTJKl
zHHENqy$3;G)@cZ1o=TGxCet2}rKsr$S_&Csn~&cY9y?d+9cxY(o~lk)VkMW$Qh`>$
z<+k~ewA52C?BH&m*HTH*AEfF2?5>qoQM_&FMLrh;&g%>$4AWiIKxdKWWS{Hi^7@Fh
zz9%SkkHCN|@r<S}2^E`d9Wzh&0e;@*^J)-<df^V<$;8R_3X|gwFLr$cNgk0-MJFkv
zbv4d9TaEJ1P}|Z=+)305GpS{oU`2NST(cX>%&&5Iov~AI;8Ps2DT6ShEK{BTd7L`?
zkyz-pV`w=S2*nRB?ARl}0Sc^c_2i%Sj{CzU2TDlPm^WF^^{YJkV=0w~^hiOtqiLXB
z3f#~-=j9r)iD_AflpJ=acTPd?Nbd`6RT6B~4oUrVyS5KAm`Ha1gdR!=i=5@#Gi_H@
zA{0BB;1(OXcc9HA2Ix@|fv*ZH9t^9HQN0jQv`QfHRpT3?r*fy|=zJ?w82u$Ljx@J(
zt~D_)V{lNjrK}I0_UhDpL?Y#;xIG$t9-dzb2S6lR3#sugbFdW@H*k(6-N}jGT(0tm
zIMJqgZgOVPg%PZ31*b{<@RUTzYeg+pc7%`!c_%eFE?+l0y$9ge*9LwE4u~#)HATfW
z^qJPAT<yx^iadQzphc@Mjeu{Aleo64VQ;*4H+aWzCaUyOY3Gg*IX}29H`$iI%D{86
zuJ%y)49mA7rtRr7xI)T(YH~^f5+plCK(^s=XLDnBTtxy+!n=X@`B1vW3Hn(32-9TX
zME-NSGuVzI#PCaO2@$>;YuW<kg?EFkh**f{+>3eOGnNdGkD+35z8g}ddtJx&0So+y
zEA8NO+6Mzl%l_Xts5{M9s^@d<La*M6mSd@SE^B^MLBh0~>5gWPwa(SbumqG4Mc%<i
z&_Y29bNZ-#>DUYWotK1IJA&A~a`;j<z8NZ>?(0UJ9^x?@Uy68bSWy#CsbWsWO{JmV
z9?gjb&RJ%-$f^sI^!Kq<whYSU+*<dQgHl&HSW1u6m8t@{GB)D)={DX`8lLNm0ApOo
zZsqCUDD|~$ztJmy1PY2&jL4Do4KqaP>+2vWArx1&f#TNrcuFi>7o2yavGs+7bE6-J
zg;E;+a)BD+hTFHHd2-^Irm6O<k1H$zHf|bBVx`-N<gZA|7OGvFa3QuJB6Tfx1NUVs
z)w4Clr$Ve=H9oJX$xYhP4%y@je7N`V@ga{j!$RL`x2AS}dZRi-_B^)RR)^b8_L2Qb
zlBjbTgB=x^w^QrdxGh8d=L!CI+byX3V=0gEu$y1!Ic>RW^U-RYjE}psB`zuPo1>IC
z3*3bg?}xDN;2fJkMY-E(f0Fc5tc4z@ACyhY6yeuVKX&FJC;(cSS)TbESLJ>G^@a<y
zZV6aCAEou^*}mWN6!Hh>1=sAX10Sd8!&&hR6^OwAZV}CBb@pUW#MQaVsJ$^y&JQB|
z=U{8NtGMIm{a1PE4O1kKfTn!RY*h;ddS!XYf^PvxgWiVQsd~}Y{5H{%3J2dfm6aJ0
zk`X$9%_%kh!M3)&Q0%kQX36_EWb)2FO*&@SOq<4NDN#YE5_bI_Scamu`Ax<nOa{~j
zM<wq^b{lMf<3)|789)a~(qgq><55&&Kf@nRDK6mx0$HS;mgWT3X>^@>cvbS{b7jhk
zHW@c2>Mzj_H%YLqjt9o(sp1WGisxx`n4Ztrpt3+S^kwGdKB+d=!=-!UeuaF-5G0<_
zCK=vF>3x^SH4kLe>|q@ZTz23L{w%@U8TYZRpdhJV3|4uFUmAsd$lD{Gb3rSH>o2#$
z1{5L3c3jGqz<Il=@eoY!d0N>nRX)8){)<<xqrYw<DpT_OXLChOo{>|%Y<Yjp<Cw{>
zX*)8ant3)0*RSam_+;+$Jd<O~Xgzu@s1!^-Dv9OXkven4OCW8iP7`MAew1T$bHq;?
zio~&xO0zik=%d`hmlCmEHd4YmrNIt8rxjZ!h~$vUY%8QUI42xO^_4(N0_653K8k)!
z<JKd}xBVs1RtLrg9(TL$JeWDw12f;f8jQLFj?Q4ru2O;Ue#CSVCSV_b;v?r~=kFzY
zAiW4)mV&NG01QV7#*+jxkkoQy%hV79E`?Frkt>U2F}^jzEntMiM{gQNUNK+pj3LA5
zWgTYeREMm^EP~Q3D!QY|XTS`PG}Ai2sLHOvG8<py$hlzHECb#7N2c;Q!SCxNbNb*M
z6?C^PpLUN``y%*{*!-gi&QOtlj+hY#J`_=4{rkS#0aYaoHp72zR{7W)^u(L{wJ(uV
zKx?!BB&xTKmcoi$`lU80{6`Egrv*U(i_(tUH#7IrHUq(}-hsAxhj<r)k`g8$-_TSS
zqaWr~P+x!DAHMEUHc}twqH`NJf|q8-a@HmCY&!{Pi|K&?bux=1Mp;k(5v9~mT?BQk
zCVB+f{`GB8E@G~kXn6)n+Lq3)HdDgYd;JtyFKyM|Ab<F6r}>=tkq6>?*gHsgwo*RR
zr~D&Rc(B!=dX&<Z@3Oq2iQGz1dr9r5w3H0A!qbW;pHn8w+W1n-)4XfoEe@GOPUDFA
z9QMw*#?az&8fY3+9ST}Ht5M&_+7B1KL)%>0_Dt=e=}qGHedTHEJ23pl-#uXwFZjBl
zvx6AW8&grGF&NLAQf(4n%~W0WL>9EhV^uBfIqON`-Ul-v${6-)XhObxi%GT{^aV?s
zy6o<lz!+U@u~(&HT;&MbP|t5Eyw9g?x>U&4ycB^$#be)Ny|h6pXC@dp=iRNmn~y2N
zrI^Dho@A5Pf=fr3a$(#-9F}-KSkH}}W$<H%8@;2w>)XZ^!H@_Sa1=fXl|0|TOV}ND
zf6)Z@?e8G>PJ#|zz#45^I<1$`uj~$X+sgp<57_g_yV$*{Zx&B9(~hvu`(0AYGt<CS
zT+k#R&p8JQV`V)0zE}f>I5`U6Iz;vZLx3|0rv(#zNRe^9m2Bv?J_VWG`NZO!ukxjX
ze*f1STs|khv!TH<)C=TJFWvzq$PBtB%N<5L-vFM)8%*BW)}<kaoBAAonwlg}OB>mJ
z(;iXWJt~kKKX?+~7wvje^cK>Z?l&#QQ=8%a@|7j;^JG|d#YU*?>OLmIRzyjoOwquS
zyqK!(05+B~EIMc!fr^h%yK69J+?SrJN|!Wcd3zHxD%F|L@ivQ`M7~7?7U=XF?wgyT
zt`m~?t5{tWe=J00pT$+Rf_Duh=V&DQZrD!PTa?RVDg;|KudL7Y=eVmZ&L+-5Kff1Y
zI0=2|U=agBCBe6%EK^5OnIUyLt5=#hflqu1g%qpo16prB&+?P$ak4WCf6W6<F;&Fm
zKV~&Dd@ajpDfRh#MbjwmOW;^&+0$b{qQgvd#l?g{FD9kRC*b#oHX7b3lNCsd9xsB`
z2IYk_s^PzjQkwnD2pv2%81_*~(hGPk!Z*WZRUIOzv8Gnfv60~U&>TMMYb+KaTJd3K
z;Mt|OR%uOX%os~Sc(!1X*hh!~VU+UaNAir#!DfSe8coltFS7~;5JHK>N5GG8JNzt5
zvaL>QLeAKNM`7463*0Wbf=Z!N7Ac#JW&HYGNQa-Xjk~r>M|3q8>3*}E=6(Sc=az`Y
zt2x43el0j?Z9p#PI^YxbYpSOJ^Xj(vS)5bIQAdAT<1zHC9#lJmiM{h3S3A!!dE8ad
z^ee}(r{4~AY2#A`NUkcnPs07$$KWG`VovPDJ0h+rwrl7?q_&xNLbpMRTy|e<x0aVx
zer2TVrGHdTGVDC3s4}ked0f8#j`?F_$;)&|j-DAkMj8=kv$nP-{X?8+xmL2?BTn;3
ziZJye1+xfEYWxuHZQ(FWP-L@z^<y+tD7%JwX2T^I07LCJcLj<%z}XIxRfQKN@TzOY
z7j*4p4$+RT>>>mW+qdnnZa0@-4*n{B;W`V%YntkxPF$>h?>jW;D~X(21zXLp4SS<V
zlddmaYXW;r;cWQsbM;w_XEp9THMP{aXSIvLo2t*&K3`Y9eXq0=gr8{YjwiVi%GoJ-
z^)ij?y||3q*hzaoSpP-DJ2*5v^yp|`ph#I!oxRWDSF^3~kJ5y#SCNL+D5AQTz3uMW
z*Lz6`qn|^=5TZS$qv?**()N$|h9+c1Z4kW|?aF1`B3GY_m!>1;pqIA`1F&M2ou2)D
zeuHVr4NJ9pTXmP<e!Fnp`o*F5p7@$AuI}C)%aJ*32Zv1!3&}63wzW$wYapA3Nlk=0
z?v~odK_vK3eLd+(Uk|@Std<r&yxf1>7mp%wN>}QB(u1t!@HC4Se!)z73f7Bht^qD=
z3=q}nLZmH!p>D?oDVroLOx}6s0kt(t!mavDlU;%1d1+helRkx|(|5Q*C9E9Y&`){c
z$e%y1y}V5erZ17rS>v0-?djNv;9@PvVOk3T&rAqCa{t%^pVg?2|0fV3-fX9Td~Msp
z8p1i^cq}&?SK!!p1u);oJ8}#y?ZsMr&ZZL{h*xAAbKkzK^3+E>+`i^bH#<ZnQf#%t
zlUBc<Q_st9t+`Vg74aQ|V65L`V0HH!m-9%J^Y=n=sop;sKo4@#k^e&CK^Q@DO7>z{
zO6ECi6^}qV=^J5$*w|N_(UMFJZ;#SRw)&iOjf^7+lFMJCw~zE49ivNt%|#qjM8|Cg
zA?KgT?|;_o34gHW;jz2!j$S%Iso{o(?}}(<=rjY*?&mo1+t$6esT373qq%m}pB)GL
zoW*4vZKQ-NHw`!Fj1a8L&L>+jCQy6!Ip4ooMUM#gk6a1h^$bqyqcezyR_U$k&J%?G
z_*6pveJ@H`nDLE`*42P@CSpBKBxa!GyME3sY{n*u20@kCC|htQDK&LWNvfL%t8r5C
zI?3|v+P$mxFs>^#+p4I@Snz_<67Y*&O)1(yRXKI*<#{4zq1=B@FigPAKv2DDX)i5^
zyWle+zS+XIarfJs<;H}?$hPt>=St)Szrcb6I{ru2OWp-7q2>mX@FOL0PIayqTyhxh
z(zSTg8^46*B;$F$*dCFm5=MXgSv64cn;Tqne$NZlqh14sRwR{wsBv8$iF}MRVDpl+
z^|0*NomY;sn?5@yyb@TRKH%!)^mCm@YY6|__8!@59ea8G1Y!>R&~SW&WTw*-68FRB
zkKCWH=*7TK`|cYNCKSSF*5S_$FPBrnhYqli2c^3i$FG<d`B}0bQQtXE<ZJDInedpL
zBs<*aR`q=%Ctz%<j_1&jr+expg%>~c+sQC+c55I`BD&3$&^Tnp)TCU)I9>Gx86R0|
zZz$uoEc0R<0`~rBaMnDS|3}d9aU}0UAJNZ)qk$dIigZA)U#$C!LgKBZXzWLHp_T=x
zOT<Iu+wPL)(RJtO8%VFMZHlK;2&(UcH3N=V4rd_Vax!STm;bo?wT{{ZR8Ir#V|GVY
z)62I~h;*(wA})2Snw3pbydi5Czi_0?t#;%pz~17@U1>sWR5AH#>WgHM1Ftl{t%0OI
zSlT(wQ^l({?pVH{g-&fu_4p1(m!uQ1zK{KO$Af7RugP}ljDPq-%*(@2T~TLq&mf$0
z0AePP-u!+VnXLOmK34;MyDKKz`&j?4!3=~>1Slxz<srjQ)8MSYjX7TxsF#_iX-mO)
z-fq3{{6Z1Y`FDw^#tra|2}93&Os%qs4LTJ=IDADC^tl|5?V{Gf`#d~`OFGl*VRLEC
z1${&d=-qE(IPc6*R2C)VTke7leyG41K{|(lG5yD}PWxoDy1iEW0l&#Ab>Am($!m$_
zlwj?qB63E{%Zz#ZI)j$tuVWTr{8=ism`c;`^U7hCxWa&R?3G~zJ5AW714>f6<@`Nn
zNnoBRB$P=bk2@MsDvev=c)KCJ);KN~lyP@0$)twWf92JVxgt5;v7ZSO`mF10^mBEe
z?Hw3x{UdUw%ig;cGj7Y>W7X?Xr&5Nz{noV^gDn`0xWp9`nDRt_u6y8J`N1fYA8}Sf
zIS)n~Kf@beai1eg`^C|z+%|3oP#nBxK*CV*R*nsi_!&`r(Q8P}PAIsgvg-Zs#zAu-
z2~tMCTU~DJoG09J@ID(-tT}tL39s%QTyG<Gr6>ccRPjLli9c0l_Ar2WUsgY=u`Xrp
zRPJ#2<2=>yQg&{>->;Vva6oV9GB497O%hLyx=QTk6PC_e2*5rU`{d{fVX>#-@wNNN
zu0NS<{=^znnLy3*6Nw2P+Bz8}5ZiA4YZ9>V`Cmnc?E^*$_($;hzw-~g_h}LEs6ZVu
zrF7YX)_qUq{%n``t_O7sai)!X4_(qC<IsZIwfgdHkM_bP+?K<uKva5fd_xSK5qf)q
z!REiboS{i*9lRa7mPvzcy_$@^l;3E+;0y+DGL07A4uW;4H;=LWdAXx6F@b6cqLYUz
zc=Ax`t!-`IB=jVz?6%?vn5K;Y?~m-q7MZ#HMZs^yN%e)MZf=X!k!MOab|<d0t0h>z
zAq)eFi)W*@H8=41)k(X-!|)0W;YW6!upQ)SRMnB{lWRTsITqrbl_>Fg>H^o>jdy0&
zJNyei5R%))R$te$SDiMuFXrZu2mAv|$bKX3W7GAT+Cx&H8uXHJ%>&VfhN2Ms7sF_X
zs-*&s_QEb=si|+1KOD=x{5t5Qjq%Fqm0DWK<<v*-usA%;o2&g$>w_K*LjAgUD`Zkb
zmx39BJYtx2uWFvewX^v?bwZO-%`jY<$gOXfRJ?IC6ga)+RcU7R!TQ6?vk16FX|*xu
z+4F2@U-XI#m2AnM`s|x5V%~4_^xWL!#H~vWPeX<U1VUF$XKXCe#4UQZZ=kAVg&Odw
z9h_+V$9BY=CM_TBgouGS%TAn|?K1bYG`;rS4!`c;P}3dJ0RaKONq9=2AGvsSPm!L+
z2%fJG@kV&a1Ac3VaI`qU-=5juh`7sHfc?BBkEUu?nBGocYRtUz_>ogDpv?EaH1lN=
zf5H4_=rKJ}Oj|<F8Ap=J)!=K#+I%&3KC&0E^>C3wkET9v^jJ^%bRR~*sYPGIG`&S`
z+7AW3*t@I{qeuLoSP0bydh{afi07I^o@Z<PIc_uG<CfFn@!&mF`kbe<edOEv{Fi1q
z90TJQA#8o+q<B)SJTKxiiM&sW6+RG!=<6;{SpMO?(y;Fp3mEcm6Uf@39w?z6Y$nJ5
zzAC)YtH?1dUt)X0Glbib9*FhT$FUQfdh|TWj%1k0b~_p)aAQ6_L%u<eu$-=K-85Xk
z0_RUY9K*<Dy|#t{iv}y^;uQ!P{tCnhq(8jzL{QL|qj(sfSs~3nk${nIqut;l0HS?U
z$apMG!~UC!<IIJ56h{lNiQhCUh^2ipdtj~)ko=g&@Rz!do0YlN3-BNkf7LB|`>rhr
zZaLIC3m9bnT*req1k7!puX5nDyoYm_s><%LTNHa*L!ERrNu;btm{N1DqwS8^kkXL;
zW=W4}hvv+>{R;d%jZH#Frvm<!rLK=jp6()a*Yh@wgY=+htl9YE4!P5333LU=D<Vw?
zlE4IWJ9JcY-X<Rlu5{#vATL#U<H1n-%@Qh1QJe<{r(XdXp1=LXV+?dHKnH|)94c*w
zi~dNTc4eoDKZx*LIMJjVJfFu$gk+64v^^lxXO1h3uDXXKk>l}T!o6K9W!<2AAOqrD
zrzL#;z2XKeT}~Y&DVkxUttr++ZL;;Mf~9Ct7Ecuqgh<M1%DiSR=^S`mVe!CPA5`XP
z*ZoLFtXF(fg)m#?5;o@@uQ!XHX^KW$w#<(Pd6=ll0sSWAqm!s}17k~S_j(;M%t!4n
zZ9h}wsdU!~_$hv&2?t*TV=CJ{eNIUFXcy~)R5Dvi0vlMXb~Cfp$j!v@7fEI@g8~x#
zn}qqNtL}y-(ZI@bs)wuF-FC*M?eBsv47y@*XAK)KEcEqid&E<lMu+_jX{}e{L)%_6
zJeaQICnQQX7LXnivbU?C;2h-o$rUR*Y`{bccX=ClU!IDy9)_z#=%NX}o688`nKY<L
zdDs#dfK5f*8^kSqo({V`dCE`ZWvBH3d^bbby>vdLS!iNQO`Bbn@u{&~O5xLq?RAIO
z>9-m40AE>clD8?wQ}kz#7q8-gp(pOVh18sjtoM(2ETe8L;zPUIehVpsG1%bY!T70t
zWZ^T#u^_z@Z~INjCF3UBobzwzDaS_cO!i00KHMd-Bj*e(d-}i8EY4G^RDqP?u;XMu
zmqs<Oic_FEyZw!kARh!edkgB88DYVd)i-PM^l&#cFZkXUiLyE8*1?eS0TXlkuhd5Y
zr!89Rf8~^ZRr`BEk^Yif`I|{iM_r~NDv(d6rUpt+@Mp{;B@}8+-b&i4_}|p<lk_~_
zx1NMa8QclN>TeTc#wV63AV1|(?FZMl`kdgUk)L*!F@UJnzD2*_G`_ScJ>o#N%2b<3
z54O_|3-CvUk%s8S?h=O)q_-t&PqsF3P5plEvyNa+Y(Kf9vIOQs;p10pG#x1f2?PKY
zfN%5q6R#xe#}q@g$5YL-EQ8H`0~tJO%K8Q$czXvQ);o<{gJ$Dt_$gR#K))t@MZhsJ
ztJ(B;JY(^*CTGW#aepMg-YTAyPonl^e-x0Q##%xj3KT7BG4g>6_V43KHg+oAm_{4L
zezY$gJT#p?g%c-lXvFdjRnnDm{*<qJJ^*E@(vT)G4frS+t&zl~NszHGuO8%kn&Frn
zNyHsi^GcbiCF3R#)@kxft+7!2(smy^dGWe?wAbTlV)KZ{*W^``FNGubkGl<z{LlaE
zS<hL7wz_}z30N_KC>(YY4%#hcm}O&CIFLObo=d$6O@{2l+F!e4Gy=}5JJ?UKV~juz
zC#V7gS_*z~WzGZgATmDOmsRTl<N|yh_vr<O7E&If8!%9ngFdXubyqtvPRF6gs!$}E
znn;@4Ae<_!rOvET+%AGH>tgA3hH+>(oO8Kp1wBx<q--ktDRKOvDb3OH8&+wVS`765
z&Iq9jb&3j8KBW}p6}5S8$Eq4P@-&&Js&i+fDg0b;#;nE)&_M?|oAjQU5FCl@vHDu5
z3C&B%4(lv);rUuciSdzHr2Nu)P=^_}%tgu5L^ci)jPj_*?E&rb<PZrlgMs`|xl4k5
z@pvxm?1YVvgG+DFUmFt7Tb9n4d7)anIX;p^x-yUF(7)J-evi$d(RW(A=C^xad|>m|
zR<yzxrI?Pw`^q9dBcNmBGOmN5q9~Z>ou0mG3RjQH-DDbkUOUip9DK5`)eD~`Se2f0
zy;vK-Up3I-mj7}QzaParM&65E;TZqWHW0>YjyTcUcz8+ML<PQ1^ko&pV~rWPC=}5T
zW1FTgB<S2La*xStdt$Kq&9?mJDzP1rvGQ303!4w{2%k5?c21Av4Bs4Qj0UvusGpkv
zU?P%{H%R$lhn&X^vt$Szs3p;CV)cg^H#7<Kir$XEno}W+M?UvA{q`BZ`xgaUe=1*;
z1-Z|7u}p!Vo3>1RX+&t}Cs#b4YsM$dX2?b_^C-HtmxqMkuCQ#{9HJ1$)=3$EKB9~>
z?gxZTydV_3apTX)%azC^{J2U3VH7d@n#7k}z^JtQE9GdTAlo01FBfAh+X0_&$&h@U
zUA0P|1_<H_Oq8BS4@`U(nKg(L<ro7r{JLm;DSD(zjU9H;-749a{a}OOv{2Ktx<xgg
zA&}3G)0B<}91$q$51z$Q6wv<pl!7o!w3e0yT(Ds03jf>^S=!V*_(=N!Kqyzf`d-ci
zzORSBN2lebxv-`RcYMyfj85t(^LWW9m;Up&E7q>8<M)blV0J$`DZ3KBf2ZnBb4R~G
z+{+QMbE4OmmuBljHBXF+U~<Uuvx9g-hD!A78n>k7KM`YP>*#w}s>@liM#eT?QCx=c
zw)aWQpDwyivs{C+yw)f3_^f~jvK@n9<#;Rt@b%g~1F($4+L{U{#1CbFPw2u#=&PFa
zJ!&C)Znc{noMe~BrfP(~2WaS2wIJ?$ksYxh{%l)jfO6Foph$&Mykv;OQ+vkS+@(Zv
zY#H`u+1s8b6BsU{d$9=6IC5zF8YrSEWpLylV8n-ud=0l-=E8l+pufz-trR`W!<106
zvObl0!1aXVGCRo$484La;}9-XAkaY_>yd>JNnLi?yho^1{QK%0^55}Lm9wvsmj}(t
z_+YUzAAGmPk+S{VOD_(EOO0^?nP$W+s-7cI<#E)V@M6JuEs5VzXq7OOSF{%-gO*5K
zJI-q=pS7OcGuJ@;6?n+y%+N_Sf0_TJc>bns$hA&-{)ReXS5yvVji?%Db;zQr3yMI2
zU)sgXvfyNe<ahmYu}K0vCvvT+-_)~lS)=br(TG&qu{$UiudZ7o+&)(A_Te{8dAzu0
zJ&GU;pI(^S;U6Bni(<964cSOK;1DsiwsAOEzOU_hl?o}F&BLB5wsklG+t@p19?rkp
zv9~QWcR-&H+=k29>tPni?X6eC!&Pos(Ga`6N^2!v17@;9`8fWDKcQdJ=>GXUG<bLb
zleO$OljpVxza1#t(y>9WiMHn#Cf5g^<Ds2~q*_LQES~J+xYmt_v+V&TFGb5MBbt>#
zYgzb3dxY?Y0oX$Ge2Vj3$`~PJ9**{6ruIX3dXbhVVFILkbNfr~GvG9h*lVpz{{R#U
zX?u#ifQ3S*SC5;vo4NFgyBorp)^ph8hT>n=es_OW%K8KY*A`7T%_1a{2ZNU9@K};i
zix}Anh%E?^o51NOS_Gj-1!FBDrg)*UzLlEfnmP!<Tw0=?U54qi>4FUQxRTU{HsMe^
zvDM@ie&N-#mn>_U5b8SpxOu~m;qxwX;lfTFfV9Qt#iKV00~n4-W&7n_?7-Rkls9>X
z>}RjO1)iHr#nAKzRKmXQfEx*q&=@c8`>9IZ7$9;pal>`P5+)|<N2k!)cWI0MGL5pe
zZ)s?<)88RRH$aX;t`*oTBjr=AkL<~xo>0ncLHkr?ASPGRnq$tVSi0{~(;Fok<Hi2f
z92uHo5u}&d);yvHzm`hS$};+9UUb>$bWtcmSO{9{9+|xLWQHZoK>~fi!tP7O^mnpT
zrKHTzNqB9BreyvzaO1vDhziRhN}1S3(p-&W8vz8KYqtB@hrUO4I<hTYfJtP>4m(Rd
z(MKswQneVCbpgbe1VrNF7uPb(8(@#&qjLtd8}0kkV{??7x-C0h=1*&zHvhoi5hksv
zZ+INW40zp%b1j~>ulZ=P1787OGvvtLh-<E4@r!OvZP+;tnlE1a0Jt`OM+@+RjyCXD
z?`>MeIEgJM&u4e$`spgyN^lrnd8f43gNDsLke5c2p5~`>M9YD=JT`Uw<1WcMPUX^z
zDEV7v{|*U>#CYpJfa&k6b)*AblDl^&P^%^tMpQh9t!X{@76ymEnUqN&4OuQ;xYP!i
zuur)c@f*&Vo`(b8clzFnUv!eWcEK=A>A+kW@EbOv(Gjb6me%dJ&#arUS&e=SY^>#x
zf_=F-E8%-V(^-YYu1ZeYdhns;Xo=lK0)?h9Yp=Y$nPnj@_M_Q1erw+5z!6b-N^9&e
zBTBOqsXn6Qk!^2DIBjZPEzL;mGF9i-ZrX%4L<L7xZ3A%IQv54vO4ns8x}~go_U1gi
z$Od)=<~J#@K?sBs9kOij$Bdu?sx`LsMRXTOO{tpK8xmazK=X0LtiVcY+hR)x=}UsM
zq(;@VmSVDbZSnHz;qO=BaeCJ0XOMHk`+)$V*9|VnteZ32?5(GM+2JVv3Hd#2@LhH0
z=#g9ge~Nl;1#0TZE`B+K9gh{~o1vS5a0**E*?V%nAd~Kx^?BfTd91lRORav`ELw!W
z&5tc_;;@RWA9GL;B@YSEYL4~Y^0{Z+{$)B2QNN;*3^Q>1+3zK|*YIW3doiVm`%0R&
z+M5VcD$@-8p>ySU-tf>?qy4>Kw2!Z7Mf`&=jzx1hPM?f3|7pTS%6~0Llz2uyU>a5K
zb8gpk_HH6}mZ$z^mhbh``)cgaQseHWV!y23C6d0}9)T&Z${%cJ3g0rzTCpy!5<Tnr
z&wzg}Yd=-;{EYqiHIiT;#BGhjcK8wI?0>Bai9u??|ATP8zb{k!kE<ADEd4)*-v1Xn
zJ1~CQPq>%CS^Nz|X=7T~Fa9~-1V3g62-h2`GNm|FlB=}?LM(T@2`L~L{_hvWF}*-7
z+BN*)<R82uj_z=sTU^cicx~EnyO9>+h=D9*-usERMQ5A5xHZ$sYzNu&e557Wj(-_E
zYe-xC+g?LgXtX`X>ue;WA%|Z{kmCh&3&ACST$>(w-ZA{!_Bog2b<u#dIyQfo+i{y#
zy3T+n@H9-=xME&hj-FL}bkC-?X7UE1P;?7X{|C>6lLjIB#jEP!((d^rtJe*#w#Vk#
zRznxpeybc%zoi<I?E=@{lmCV);wco0OOLky!c|jg7CVW3E-iK13x4OR6ZHT;;j<sG
zgY?VardJS8=S|cZ8!wgL)`!>&5H76bZ)Y{{v%k}$2FyOtsm?qahMrhI_^3nXIeRuw
zL$Q_$spI_Yfj;t2Ao*>Vq`@#H(IXwW{iTAnO;VA^!cYE0NC|AQ4)XdUFSe$ZVc_9V
zKC#_t<EC|zu2M`VP8!)7jn~gE>u*u^y<gZyM>h`KokFx5n)CUa@Sg!MPRNkmb1#6u
zdT;6%0u%%yA0kEUZb{PE0sa`zBUyw)ct=(nGxlV#x9C(4=|f)~z=3Mbfjv@0T?U?7
z(Ey$6u6k>J>*%Hz`a84ii<)BcrO|MReZ%nH`K8-g=!+U&=9a?J#vOD@Ssx}9(uTuy
z6)@Rc>Z?4l2fT578aMq3CP(~MN{TR6E$jx^mJ5!wM_9+&Rf9HUSMQZG0pr6VF5_VA
z1doZ)rL~r<;q}Ff1suNmtaHTi(Gwe3{R>3Q8zM}$ud4|Gbw~v1nS3pItaZ%t_m~Tn
zu?fpMT1&RHboLrC_RVn!%hK0}|Dt}26y?iB-T}BCS(>j@;2W>3A!gTKR0@j^tmSEh
zpV==T8b(|g@Q!rQ-H%=R9r1y;2+g#ERGUp4AG}R#d;UcYJ5G$pUchU}OCt~H=13IG
z5ra${*~UTOj}4>s8kF=kT%%hyCuA2BaMA{gJqFspJlU-v4M&DGa=nl0?WtDvXgqm_
z*Xas&YAnm`i-YY^H>greV_bH^P;=U74~L-%o?il>+|3(^1bVOc<Ma=p5q*^#_-!z%
zn_<n9N<hp$le2;G;Ir<rRj~FYhNlk0Pbd5SkrQ)eoF-aWS3sCGO*3)%y2jt=mLhUN
zYKnDqnMvH2A+~wqi9o1<C&m>qpu)_ia5;Hq?M3@g`mOKS^FaXtl&-&t7%NKwIA0#3
zZCE|^?E`exZRc|5ZH2Ub-Qtb>)fh<30AuR4DOtRVUGr~6N0o4R)+~yiJ8e7pFYzNz
zx#oizB9eb2s{`-m#v$mfB<0O)EUS-yg|C*H4yx~R_ZsP@IcB#4x7i|)kH5&B>Rt4b
z&z)Wkp2o(r#IetNzukOJsTjq3yXLryvkv)@L34f4|3w4~XP2b_&x6N36ZVc(M~S`5
z^Jo%O8=7<l-t!N@n=BZ)06qAx>E%DFpg6M}+~l|ORXA9Fb0(fF5Huz6ipR%bD$L*H
zqy5YYjwyNAQ_5@#0YbZX+0>1?0|u8=RFIKhdV#I7(l+d@)IUEBr=?W0WuIV-c)`<P
z(0=uJtEbu*(IhhBIQrA(Dj8rYVxqQe52$A6v@*z>M<deIII9cQHteIPszZR$;=BBO
z?wiYFqz|{-m`=k@ZBGZ{f&$T4d{y0C_hasdsTcqfeH`yXH7`G^wm_YO=)DlUUk<bj
zjrP0PDr<+9KISS3$b3eZ09GZ$?bRbw8x4L@HI|lF8U<WAoZjj-?;SuZodmx>)F{%!
zJb662%cp;#`XH%vG_GX?t5<oKurP><N1A<aXHzDB1OMx9JPCP@g=};0d`Ead+1|an
zPMAb)%&BY=L1g8ZWPBcCgNT<AK2MsD(+9I&PiL0hp6I8HY@5bJC>ArOyr)~P<&4jW
zO7>AH&?3%27Jay~BVJx^H|!wSUDqSwpVmq}bsClEv=uNFyRAC9<?JD&q+W9ZnPTqR
zu=?rI$^uVd|JvI?KbRAi<1^7~HSZn*`%Xj(Mqbrt77Bau6j`|`L|Hz}d?0#%xLHlN
z>erHh#;8*A2ly?D;0CPl0dGjTpJG#I?$_o5c8Y0Q3C4?k$)Il@RwB1jzViX&@K9lD
z`CG0Sl~LnwXZ3|0Fjd8L8@wiU%^pli5Tm3evcvWKtpkMGwltNMo`(2PBTcHMszlHZ
zjtFi(z>O@~McPGv*aZD;E;H5L9vaPfL%;D>K#4%)Do^xJtW6R^AM-MaGi6L1lUpI1
z$)i5n(C!Wh?IL<R=%XT66G6=_$L*T;<;3)C?gc_;c?MF$wp4eg+W6=f&O?W9EnkO|
zWj10@zdu`VF3@A~Ocg0>m}dI2beM8@IF~dFt}7)+b;X69^}uy_mw;Qe4uTtOzT@Ix
zgNzQn8U)+^n>L>w(FCrp!h-c<ae7{zAGiM97>AG7-`f#0-}f%s8_SC_vuPMfy<LcW
z45!alKb)dJ=-7J<=xa@f0~T^->IGC+&R$^$?`pJgWG6{@a?>>Tn11LAua(5jdxAZ^
zdth}&$lf1-9gh{|%sCK6=}XSi`4m3BarSDK3NOQNiC_Ne_kFvwVtF__dr<K?`fKqI
zN|klQ`pj~dT{yg2|B6ivedawm$ortKMDS@%f|}j8<@DuA#0mIJut$%5NbaG(XM`T1
zm}C5{J;EY|DW*qS$;jx6h67$3vSz1G<+kvohka#O$UfbuRHe4i1Ly%)2A%vH+TR@F
zMz<Mx&Pp?p&2WD<x|5QOrJ}@XR@tQFlC0;Y{sndqV^{JC0~`m_W4l#+OdiRxP%l1e
z(h8a$BZW)$yksN-gRm;t?e4}`VEmqoOQQxA>Z^YJHB^`&93=)gH^(`~V<^ZPq#_m|
zT^oY&GUn|oy|SH(T}qI_B*5C(?;|K~)o(Ru>l%eNt;#)rFrqMCyx~w3md{6ashG%F
z>ZSILi1A@be$P=SYyAjAT&#;z29^2B&rwL$7}WB+{$J?R?}zJ^$Ws%8UxUB>Vn{%_
zg2#aUuB5+2(>|JKAp#8WvM1Y`r7c_7dm8(O>xrL46PtpZLl>;*))jz=iS+TMhheoo
z(*Fr2#0E41wkrr+qQk=Fj!T<dS1X$1A4y(mo*QFZ&=+{hKk|SVZsT=<?_wQyyMOJV
z-KE?~b@MW~x|8tSQ2hb2wXXNqwkNox!~(a8gD2-@!TpNg1w|qxF1Ji46y?~N|6G5S
z@f{T^%mzG3x*9C}KK^YS;OKb@mw+~1vyv*tDbe&Wbhwx0->DZ=Sy@%3t9-2!g;~5i
zV5~Cuh1DrzYwRc^bl&#$5Ps0#70#^l+qG&Vq8-ZkS!Xv)t)nHVFscDS4(65_=@je|
zm}*|QQE3^BAeUU7u1*J&>bhX_IrG$Y2ohxT*4%oL$8}*U`r6ts-SiSu!#njyCN0iq
zqK#<1VAe%VDE>(GeqSvD{zdo>1_vCM9ErKLk<^^HEFMhqCoYVwCe47%Y-}8UXLZQ%
z>?+tsUz5UV>cRcMr`r`K&Qc8SBIT7`)XlDONl*M|ZINs?ZN-ZRDS_55Nezh$-)pMt
z7zVELic~yXkA;q#2ErD_!mT3<XVMcaISQ@LO)%l1aJ#^-4}10zupBbXWyPzjnR>A+
z{>QN|d&KnYdm3Ef7xgg0@vBX&Saw?%TjA1yeZH&+u~kXaA;GF~>OcA}h+L6r`<2>G
z2+?OvnL6r)7B29H#+Js2&4%#VJ%sAPQU>yEU>}G4%irak>j1XVwceXfY4Y274kMb%
zAi3k4JV(B(nu}RcxR+g=@XbuSnCO=1@i$eb=09=3dpn_(Ai8iD3<3#{;~0wl%dyj6
zGAVx`FS^k@y)>H0^jFy$BJ!WQN-kn8$cHWIv^tDwuvCUprkh%tMc?w=mm5$X@k`)S
z1k8ZdtI)G)7DIGy?TM!B{jhPQ39+5eeY8p~4G(Yk<k=1mq<d=9bS9^EIZHk5B4};{
zCE%Ib9~Yn2oDz_b6CXDShJ8kH{&;Q!C^R36Q?UytNJ?C&EgRYwFCoSlf>`6}9x0{0
zm!)|vsF*PEq%UKhBg=zX4(PjD3Dp3tqBg^=PPaie0JtDcXnT?sMkHc@e&=*A_1lFx
zD;)f|vH!?-$zX(b?wavBHc6m8zE34@?oN9hWvbmMA_Ei}$5fl}AeVs~3^%y{m8b_u
zTY-8kKY5N(T%pT;ir#4sNWvzLA>0PIXn4pGAxsrsKP!A<r*m^~eruvB+w5r@RxW0m
z$F{W6ek=PToL98?4|tCf$6){0&C#%@?^7~7SKSv`esZjTN3CvUHP0RokJw2uH1$&e
z*CYQ43}$K=tHL+L8A+yuA>SW_bbLR<II#ZsJFn4oF87N0OaH6MgF+r+7H0H!&-2`&
zp%YsF9PfSdzskMYw}5~5bpBuL?*HFCmG}d@7Z`<lZZ+>NQhaH32<-(q(l$B_ljLi_
zYyr%_C~CE}wQ>}1E-$)J2#SO~!t6h+fLHZF*P`rgj#SyY3O-dHUJ_Y5QS!g4v(@9S
zc6<BR<#RnIuO^q?<>RfxY!^H0SsUhEN_XsHfi-P=7h;WbbQ-jp`(et821h)wEtB5U
zEdTvHmj?3j`o%IFYnL=HeQ%ulzi#%EF_#rjm>t!hHUXBK%PU6y+RFwja!%hKF!OI2
ze!&{e-|b!e6h9=cd1Oz|GpF2kAF))?mx9?_2ovZhAIHAH>=;B2S(NSCW9*xsf+cI4
zepwxHGfThXfsaJ55zg+N!?PlWOjr^Z36RzG=%)Nh@8O5o$3&?M+iUk%8;+HV4v?;s
z(w?uAe-|;gJeSv#XV}iosRLcBbG8R0{25I>HE)T;MpwN&K4`aGDb}in&+QQ=!Z&i2
zn0TYNde25h3(UPi2)v99(vR#JE9JeR0xcISp*ENr{FN<AhLk6nRu3U7$)sznzO^!n
z*3z>(<fs?abwMB1ogL(FupNx;YWvPz^A-Yw{`N0ya}OoCLCiZ*vz4dhQ|I6DjMRiB
zFPeIs>sy2}#=V<YQm4FlCNZ?o?_Kb`v63DJLKL~?+A@f8reNIXe~!aUk$=3D<QV7O
zxb=aBL);A)G~IrIPS<8`oksl0cAGd7_G<;bTpie5yQx>4vJ!~pH8+|BrC399bordr
z)MAh@kxU60RW8o`#0A}8Jl}f_G}GAQ1c2xG#A$BDh}!F1z8aXisLdoLtZ6zzgIff<
zhhd<7qvvyg#Nb2`WI;4M)SgIua`ilUai36YWTX4-Pu);<&$9&r8-$?t^_`tE)9zXf
zY;K@O?mGPDU$Ii#19D48ZJT1HqrU;IuD5Fe#&v}q$293!7hmC9YxhR%aFeT;o<i+7
z<rK3xEm3%uCcO{eaQ<RvIrYk&@g5R-(Dmz`wQ?*9%+xaC@Zdq*2OG<2{<_U9ZULtf
zHk&jvJH=-8X7wbOgz_Z}SWUvXGAPB1dlsF%+ak|=o(N$uAs+G;i6-AHY14nR&#xGP
zSr#I6bbhP}EAG0~h>L(<Q#^nS`smsinMT{P{Or2IO12i@HB+tKq-k(!sCj!7w}UwT
zw3AJvuejj4u?w@=+^<KSRUGkg&fc<x-y$%U%~$4(p*&&xPSHZimcefV4|<%v#{6hp
z55KV41e%K;MD1S1jhErLx(AYR-(oiV`JU3sL;rI5e2-jv>92z1@TZcl!V(M#@BY%~
zBPG}~T7oe>__m-jeM+cXmj%4o*gU7&Mo?L8{WchM^?K(TQH2tyuTNUQu;WY#9oJuN
z50uv7<)s5eBI1xEH^fV$<pG1hwlRbaP+&KU%Do3ifON<W1s0E96=$d1O~H}fsnd}`
z%xs+x7n&VGcp~|BSbb%|PpxMrCJJ!mQ`zua(I@;yPys;x377;>qYycl;hkYzXKQxp
zA1iNGYq1{i1Z<&3YL4y>g{i;LazF0^BR;p8e_gXVA=$h=SoCkcXDZpKB!FNAGrp=z
zLl?ttR_8!BFVf7ziYnlf+w;+Hy)6p*={{+SmpZvupst4TxSKaex%9fDYj!x+K7L*c
zggCq-)3EErOd2=Jcq{aU{*Sl9=GWf9ne`>j@%7)X#$lCUVf{KpzU|`P{8je&2}jt@
zsq;ZML>nq3`CpHi-0Uqs8NM;c_5We-t;3>hzkY8K1(gy-Iz<WTkfBjfLL>x~F6r(Z
zQc~##=>`F5kQ_=nq+`f|ksOerh8SjF=zTxG`?sI{Jn!)yd+&eV<Nc30fPp!$>s;5l
zKI{8k3rgTqe6Qz9gdy(rs(mJ+vnt5_8|D-#EP?h0lIwzFzVXl{>qbmd)aDMs$g)+9
zl;)e(cpA76Nkx~R<~{OrDVGuDIq040Y`}C^BCRB*@0~E0TjX}awMpd#9izh0a?mAU
z*h4J?Za&PxFIA&goF_#mj)tuAUYZY1-A!B=yyKXU%jV&pjvuGO%1JvaS)JcW?ony^
zWW(=Ke${G7sSd6CmZ+>Zy`bqF+>$$<?lEt=BtGwqN%k2SNq+tUyuTwq^dN~h)@=?<
zo$bakyc821&%<X}swB6?VZ%0EmTuHdvb0%`@3Ts2W6$XS+Rrrrm%R<SBFN4dFw1wR
zIt}0Sv~qAKrVtMjvi02j@0+k#^huEsceADzkKMa^5czBor9H~PnX2vvBP}6gLJLvk
zOub#jLE9?FB?yPuud_p-O(55WUrLjQzEjq0FFLyeXB#gJoG^h$B>sjxuL2YzM5-k0
zSWUN9L8SQ3b*_%vz!NrmIT`!-VFgqXjjNW>D<VE)sI}so*rL(62`rIZ0L9Z^9sOg3
z3^<4@!yPmPOgB_0CfoEMHyr$(M$S7~-?DTW!Rz112)V}k*4b=#GwTp_tZVC=WS`NU
zSWXjNG~C^lxDUpxB9)EP%xLXNhUULU(;5$oZK%_?7K?gQ*sz^a3|<-?^*3t<HILaQ
z(=vf3>nWb?Z~uJJc{?<Ng26LdT2>4&HUb#~HmlfK2{w$+M=+MVsQshEI*i9B_jO`C
zH^&0Twae75CO~Yq3sqyEb|nWuhbv@s07kO}o#Xdmm|<d&mJHh<d)u@1iswIp`a&P6
zggXJn51NLG0TBX35&T&q^W07Ymi5`ENJojU(C|ohZhL<6HQo~XjLTA`zJo|2Yk|ct
zvbe9_?7?GiFyB5gU{#;XS}^rk_R>4@jI%R>@lk!rpYWC%;HuG)>?Dx3oiYWy%jQm2
zeF^o)`9Uqo_T62E7^*Cy<sm!4ONUq<AZN_SL3aWwpVPYU)c(E6M%>Fq)yM1dbkOB<
zmc#GH)_k_sOym`V1oj3IFWhCNg!lp?s+OG`>#~MWu*Rc>12eK=L995nv4BSjTMfUT
z_ACk>@>a?1ZJo>YjD3JMLE7wMQ-Y8d58SI4w3Ml**UJ>3x0unXB7px6f9O?r!A3w8
z8c>a0v>Q0Gv<ux5xSvCU?@Ylx_h!JKJs{PHh<&iv;6THPiF>0ipJK9OISy;RW+uy*
zdyPh4h_YD699K3@X}cxgg>oJH)Ij+>%IriRrbPhX)mFHQN)7h4@!A<Xp!$)`@Awre
z(U(!aHeM_K9b7$UUZc1(?1{OguBTPY{vY5^iR=|M&iS$zPC>)_SsmX_{X1HAZ0rma
z^LjF9J<!B(8@M%*fwksmp+S0as)4gzz+OeIC@Ly@?+fl-t&!iU{|jLkoBS%~9y7?o
zBKXlq2|1<CjJyNqeVBZYXKuWLa!TJ}0w7%%dyFG;jYKLy2$u~Y1b(itLSfG+6fK!Y
zXGw;`qlzV*^2DEu0?#f0jNf0XJ-Ei(`fI_JPJRCQ$=PS?0XAeLSG*?|8MaKHj1qJW
zx3){YpW@ZIVKs@v^}Cm)_Xk9{2LO2Y*FgoDsLj!K+rRTW?GxqTJ~4y<$>Q9e9w(>6
z&9r-hoCZCcK|bw?tV{d$?J-7#`R$St2Ungr#XDnWn>;YWdubFK0f=h;duAOorP+YL
z-qY;8!t59N08}Yk#jFOqjnvW)8Pn6pG++i#gTN`L-#PW0&%r*;6m)m<iRqNzM`vQt
zu5R7y%!k4;_M!x)*I00f0s>G~DJtCd&laytf0Zj8V>C-5!OnBx^{8>@Tpb^eS|M(>
z!1jEC#2Ln*=jL<BissdlKzP~wU?T9j4Y>QZ8!3``o0yz$rz0ZXpHDsNTmAdveu+sn
z1ow1d>PdfDx*AON61b5e9WJubG~#v4b9s@@G_}Xr6xS4av_IVvB)3k{t5qKUnI)TA
zW<nUN33WS9QBn>wvE0V7-R580Y0+lzjjtc-s(M_WR(wBrsQbM@CBh}X4q^~W`>ggz
z=l3c3u(0l(PlN~T6y{feDquEP4(93i>s`DRxZmr7%{+#vY>&GYz&m(QX4%y~$R$vL
zK0JT2$L0tS27e8&k3IJ9Bjs_{a2ibmHr8GzzdEgLH}-n>AV3kPDnFxfokIWCaW@A}
zbN*E{BxFj_jk`+tagV#1Q(Nvam!AhG>YFzN1`j*|1-N1{i`wjt#kZIvEkPOuub{*1
z_tSW5Rt0N&Wty99G~<NW{k$|F29dYG`~EcV2m@Enw_G+)32rjK)H-XUew63%&Oxal
z+Qd>o`w5}PYN!zxSB1Fax2(%#+b**Yj`T9zJrv9KtHKzgGfVlQ2xYOX*OFVQzju7m
zYk6&L=*{mVQr+iKd(Kyhxry&<-!nJh6zU^Kft`VinKwfrecPCZM)pa>s<O$3p|HZ*
zk#L+UeC0)_*Jj4ggx$~!WxJnyQ6av<X1TsLd(A0tW&jh+RrSBH*`(Sk%!g^-JL-te
zT`_%P^*H1H_Xgei)JhwmWM0m(yMf*4sV|Zq$h`05wo4nm7z32<fs6pq4{+7<yb-W#
zgebR8en?{l%?MDkJUVJWY+GA+5W%>^A^W2Qm$-lmz#WIzQf7EKUlj!L;cTcp;0J*`
z&<Bkw6Od{}7VEbDXTd2p4o~1G|1#p>!<!AJZBK?f1<o5gq$`f67#R0ZlH~UvOafMw
z{KXOAf}L(PP+b_@letZp_3i5p$)p?1=*MXgk&R;y^~@yHwi&(5S?-Jf0WiA(a^|2P
zNIZ_DANHDX(;uACb^<H~I<ae$wioDg&{-WC1nM4}Uz=~ot3we~+BMo;m5}<T&5Wge
z`am8GbQgP>wAL<Rwyg7+t`a`4$){IWb99E!PmX03XXkFN$qFrBRETzupUj61wb&4B
z*6`cjKLY)w#%T49Hb^bIvpEZB5T=>WvaZ}ba9K(P$QA$a-fBtpG&xSPTiQAPXdIfM
z>)@olC+0Ahotvmwam@SG*8vBrnBi`mY5VAW<VsKCI7|I>(;@x0wS_zf!A#WWczZJ7
z$Jw7M<&*Irk&J}lhx;+@zOu&r@3X#owp5S=h{=Tm1!dROobqZ$##k);Zn)}z_WVNB
zF_9VfkM}8^fOSNwIk%;!?8-bs9WRi~E#;Lb5-H#!(9n{LG+6eM=f6f(x`GBAT6FqW
z{29xAJaF0`;36x`^3A-bzq#KYzS%ttbpdO3MJ2>2K7z-FtcG6L%}lJhSYgcDhFV@@
zd>r4V(lvJ#$LrIltLFHxHJd93Ns)+|aN7>(!GI^tt@sDL2GOr*<b-vz7ys1jA9JI^
zw{Q1+DiUK*%5&(e<`5?WBjymKJB{Coe$CF4^<eX<#I8B$_o`eS<nD2n%=;bhmn*T?
zt@~~`sdQy8aEI(+`*I3eRCTlp)+`M2eiXTvD1EvtjOdCSZv@la?fokBsz0L|ud3SX
z;=DX}Fu|anVqx)A`K#TNkRxn|9^%d1uRl0>;<nxDPZB^tsCE|ou&Xn_wfm&?THCU3
zv5|;0f`(U{s<sJ&Hrn>%hYfzm>Pj8x-9{C;{}^9-0f{pUIG%uT)4$3!M3^W|<P``V
z0+-WgBM-1WbkPEWnQr_dqBy2Qp>EEGujS3FM7Lt$u`h`vxBuSusxmSkBj_z}oy+(U
zwA%0F5nS7*z<FKQ@FbEYBf84LmIGu&nnU~S#G{&AUdr7YoI9x-L$sg&EMZQ3&Wm~&
zgUoekv74eqDEkCWABiM{{fQ=4RT7ee#84K#ORWWI!;sz$CEG*RE^|LD&VfYx8x@t@
z=kU<cmw>OyQIQckZQfU9DkSsJzPU<?2p%#XT0c|#rv(2(jF0`w1rk9-wN&LcQ|`0m
zD;G{qQ*j&Bt)TD#L}ThfOz4^x!MN{opxHk9Y4w)OT!2#eXt>y)XV}T_CXG3!%Lc}p
zxoOgWun#}ezjs*-c8U5&f5tbE|DDE;p<kAtZc7OHrbDgjIli;K=ik3#GMPS01u)Pb
zRNW<O($yT9`FzJA#M<?I?+tm^SFf_Zg@YOLlS~N3He~&~NDkNwHh3A3e@<uTu<i?K
zLD`^AfjYb+Gfic~?$~2#!U<3bE?{*iIS0y(m(}Dn))KW)@BL1yg;JVE0G-q{+UdpG
ziTnlmi|B$U91j181vXRDD}ai>c2()DuCIDY69UssQf?YTL4<KXmd2c3^;n{^`aC~%
zA3Q%$F3?1$pR(td2&SpDOTvhPdu%f^@8S|*Bl5ZUo5=K8#roJZ#h+39=0SFb;Uqn8
znnf>HL=aav>atoFgH-B1+8TPgq_sU_ao4t7NZTtVKKC>7l`wk};1;>+r<Be*+2(f<
z!0dMB?vMKVr(KlH7a+~@6NI2os4mu36mvZ}$-=Du2m)yJd(1(9(2m^ygmz?W5kSd`
zq2@wz;4!}rX#;VgP?QhYNPE}DhI;HfK6B_acue^fnFErJ7M%%)SDI<f=cJCCoLu==
zGPD+9oGq=j)>OKLR&J}muC0DtA2&$@0TP-2U^>w9=96!VC+f`3XCrcEjC|9PVk|8q
zyt8phbR3r3E*k1%*yE?se?`dt@v*5X*XR3ALqfaJoL8<55aHi40XINFu=^iMfk^+-
zH0KvdP-b32o{OuJchg=a&+ZlF!Nut4dclEeW_47iQGI&j!hCvD3$f=oIv=-!{IHOw
zW!7f*6aF+W;KVBK5j%0L2E!Ui>ybyMS5*Ge7bp+ZVa)<$=th3YB9AxgkKcNTM>8(Q
zuRYp<=Q~w2_p>~F#6Pf5P!&AOD|TfxlU=y?FDP`eQx}qH=>Q(yjdX4thzNV}F5=Sr
z4-vX)w)VG1;b`@D4S>a4vrk0)x2_-s>ejTqXX_%-V7dG{4!D3$u6M~IW#_UZ&6WGy
z#_Bf`TN|atqvjw3+c#FGO0AHJw|3939&3$clK%w^YDGWRuZgPl`wfEJrlRPk$Dv=Z
zAacFIbVmyY?c057^^5EcIPAXh>-aShGO{fc5PugCL{Svc(jBx;21(GF*)`}V%Su-=
zGb%!YIg;Im9?pebn>QDl(EU=iEeV*7K^0n?7QMtMuWdP|NNGk5-DGkRoF@H9xDd5{
zk#}2cce$4oNNuB<)*3J2&Ojr!MTX#TjMeB2y;!fx(r>ZE3zOjQ4uK4qP7KX9?xk3a
z?kApl`$bZ>ac`pwgGX#3JCksN`E@-?Eg89@fNmt(-Pk>eir?s4s;Z@=F^Q3Elxxo@
z%A7r!+C1Kg8hv&qAc3lOT)T$T^IKv;7`#YF@Xj@LbYaABc5-3O#bYaPcQD|7MlZy~
zFp19H=NPuX_@=up>8#yg)2-et&SY^PYdDB+v2}JN4;3}gT`)BbT#YdifkreRo7Oyt
zlVW{bI^CGNuQcZyHn^`k2upB4_qL4gXHYfwH=9orglN3S1Ak|tZy7;p+^V^avS1*c
ztmEzLujUc}<KipIQ@f?s3!b>`?H<}Z8V>%(xYt~roIbJUbJ-+t5@v;Wl<HL=RCguu
zuu~#M7neN=2{lCQj=_g^w<WlGQ5iBl?i5OkUm)RD&+{)C7jc-N5|?C_ql%Q6C0v2i
z*|w3^37A>&_w@4llZkrUV;k?W%~LWNmos6v)s`~xbRe(KZ~fhbF|;4QCMSfvAf7MF
zKR2g6qCK_(591o3|Dmg$shLhZ-=K?<{pE5ouM(YMp-mIojWFXORo8blH&_Kq<MUl2
z><c=GgMI+m9sx)#zPdlAHl^H$)Ojs0^f(_cX141*<+d+Z<CH%C)^YFJn4-pI6m#XI
zq>!ToELSJ^dLlWu{B<MWqFsttfYL)?0#JHP0zQnAauqPi(c0x>?*Kb(&(3FI$Pr0^
znfilCFV|NJyW@3s0SeHel8CB$g52-ll00Kl+R<(pI9j_`cGZ^(N=_hJeb000uVdw8
z|4`b?8im?GWaI8|4&M$<`tIPW!1?h?!FkW2wvTj^;y);o*}o_fqP%uNuBG;}Z?2*F
zJa?t*OlyvSHtX6z$ZAD6zUj!uk_^v4l!@t;E?P|OA14F&oA$eH_idBkI$tx?sWv0V
zVGLfLtbY*xf|_f;9%W!qMHe7sO3wZ(-KfdtEL^GJ%gB}U<ug4e%((3kv^S@wYSx7v
z1-PEFZrJ<%O79F`X6OE4z}nZWxq#gt^j!L0zezoXcJuQHr%2?*;5jbPs;?!T#VFkQ
zn2_R$bwz8%H+8v|U(5G{p5FmGB{TlYV+5T)Cp=#^zS+Ypx^IoK?7K&7U|~#(j3jam
z-6CcOS2~YhQ576MOQ4NXK8<9}gDc{+eb5qRS`M+uTLAs_e5iHI^{y58It6s1!kP~|
zPIX3}eo8$r9Gbf<)HgpS!XJEd->r?jhgMCtTu3s;A;Tk!E44wFL990!{DY|N!>l)g
z!bapj0jKT*A^~g`pM^8CG{21$;v8Iyz==P(G*9$cE`-6@$e|-#Y~NH$KJETaNgGZw
z`-9UCHz@iV4&$ilkUhFf$>mU3nY;INIL0e=t_LE}3gR5@BB*ti{-u_AKC3!x!c~Xb
zqjq2vB*AfrA4m`DIs6%9fx4_`JnR47rs+Hyg|{MzJ)E}|x2v42>E}Oe7%-S^uph^v
zcg%p@$VldTG%URO4?xww9DnYxVCrn_@1NUFpQL$n|Ip0)Rfe0Ff#TfT7{d6R#ev7S
z74Pjn_m-oofwB{&)s^VkAze7dtFyIU{k@j+25Y7^^YbZaXqJ{eyv*Cekc%me$H5xs
ziOoYI{0%z$*cCxD(xT^Jj}1NDRvR7}dfuPp_<~!d=+m(t0h9ohHxC6goGSG;4!aXJ
zwFV=xKv6+jO1re?FClR#fps_8bQxDF(446Ic5+@U?W1C~zZi{0zqVFq7eJ=E*S2aE
ze13FSx)~erng^g_>j2}!YBwp4{LfO$8>Kq1Y8v}zvxELp$6I_IE0dE!%=2xt9gi~)
zgF9NpomX!7awk*2vQP9M3S_y7t()r7{SRc-Mr<*B181SnBwEw(SD&Agmh}$_a%5yV
zb%YuxzK+~Kk=1~8uVs3<bi?^ORUlJP;nd-PCo-Q8A*?VdSnuwPjbLN%8DQWVnOxMF
zfFVLcQj<INJMuHGAaf}?<;U&?)w=y572pi|Mi$B5nI;=0rkkXT%*tvmOGEg7<dEkJ
zq3AL*($wz`*IeuF40x37c`f@dbdje@_U=jfaLDvDNvx4lujU66B|jnZ8Z7XMu|F2E
z(wxoIHJOW#;M}{JLebJ2gJGp`b)w|z(lLA<9CLx~a7LiN<svs9VY)GdK#v2+Ed6?U
zdrOCJnmSSpRxp137O)FQRT9;K?1|+_j}r&c@h@7{zjGsvXr7Gu8XzyJY{sspPT2j6
zcXQe`OkPjBE2xwF^aEoW@9W+Dy6j(5J|~V2AK8}U+Z?b&6uD~R*js``XgLKP2ebJ#
z?0qhVUaq#peK^$g4F48z!wl!lPYO>cqAP`4z{>n$CSx&0L$&TnFTMEo9cuwndFT(&
zVGORcT#sHTE&1O|5nsSbEh7;3Ghh9T$eFXXrh<gS!`KDK>nA$3Ii^q58Q&9D0k=6C
zZk(y3-p4Ya%*Ni(62kxD-~K%Gew07<shM8_btnN@;x1~DCvV);^?POk6&yKGGUTtx
zfX``D(M8LOFFBqV0;kb`%x(uat(yQhTnmuXn;vS5cV+nB;8@_IYyS(5buye)_MNxZ
z9mAvZpD9)cQ$<Rp#W_~+29}!kUwgvW(h82-rYdPVwoJmE8>3LlAk_58*1)tqT+Ou1
z;78}TXXm3CiqrRy34^IN;x;B&$FqypH}Tc_=&;+?sG?zfVf{gPL4ruH5=sXz_&k9R
zHWXE`p8xGAyW<&qYnPEAj|?rgBeu{Sz3^sMNxVMQ>+YkB=gio%DoP6n;aoSstEAYA
zD!`&dC!!2uXP;W!RT}d!u=A>#Wph9_{>}SK9r?`3%sVZ#6AN};#;G^8^S+(qHceTM
zH*_Ub<UkU0*=bK16XMa+O<krieh9$@I@|bjd+E1uib1lM^JL}eH1uUC5&3r+1}4VN
z7?It?%w-sI!Xk+Rsy^Ijy~Hs2k<HA8VN7zXcuTWyL*N#c$-VzLooUU@&2h5$d==`U
z8G{!naFVw+_pQeRmYRARwVAZT&%Mg^-qwlI!7wP{j$_lyfEu*x60DOJP|3Ir7pL!L
z-PE3^+ufDW4rN}sYFeWJ*}U}U`}lKc9tOCeS6#U>8o2iBUOs1b5v*U+T)Z=}Q#bpi
zhlcvQQnC$W=Mg}-a?V{(?f<Z~ojn^$GF=Hr$k)YRA-h3N1<)&<NB7z99y376_5LLV
zl(d7mzNP!K*A>E<A2jD4rr+jTYMn*g4>F^_vLoy^z{0V}9xPn-tKs*-JI^qhk)3bY
z&gIR<Z|@JNszX-WTR-e~Oto}B;qitGF!jIJ(lo>JrcZx%`gmaaFvu|nzcI%lu;u3M
z9pPpSs)IMEV1o@VNipM}<~dLi8WhzNlkoE=6BiK|G)Ht;ID7e)34LdHgJ1&kymyS$
z4YjCit4I>;sP}g}o83y{(iWHAUXj+j-7j7S4Hqu_i=oAy1!1#%WfOUM6o(>r_F0ii
zo#%NY^5UF_>&vvA#J7QMI>aPk>6lt;z5AzX2EZ2lxtmA@sAR*VzLEvhmAS`e#xCc$
z1T>^DJZf6aaIA0=;Q*A3PtU>!d$~@TxYhzN=<$Fu+fk07^Chx;5P;Ft%`vP=2bV1i
zC$}}9MaD}t(|s!3YamMnLn+5BEasWE=&ovxmxv@DCEpk3z9e(L%QaFm9O(uK6CDf;
zzb;*rXUj?fR0`p9&74IHm^e-3^|-umvhi#-3a!f&eKhd+A4jIa3c*N0ZYGKs2F-@O
z`VR6-^mw^MX2aji(|EafImrO3^t+);3DD4myuJo?=EFE-5GADpl&g=Wg;y5;=awxR
zJhJq9iJ%>FiY-C2DQWB%9kT`xh3<Am?|$5|)5C=CM>s&3&NB1-2iqdt3zawn8My$N
z>?w%YK_6$8{8zI_aC2nTj<EnSTEQ8Dvc9t`L)#;RohFsTACvU9oGdY;0yoSMzJjUm
zX~;e1!gt*Rz>|-IO)A%t<;=wF8i<wot9B07i~+$O**k%Alvb`WaxK~MlhN7x0Mh>c
zG{3uagEQC6))9AjBk9<3d0z=1AnmDRFo4LYIb)ZO;9Emd-zu{@0sH!^)0<;Lk11ty
zPBxZRV-$JG>rJ>EfC|Ws{yP-hvM&oM?3s%J){5E;(!7l?zUtXg`S6SW8tWnsqSh*#
z;Ju$xOJ2)+=~uC$yLg)YS9P%tlLV?C8R(;r=|RW)L_ExH_;UnKC_r%VA&!Y{CoJIL
zqb8Gs%yk=qX$xla)iSh<>(CpO<22pqbolC$FOA998=^%llT#tlQ$#W1TXzum_!@lN
z!1^9QOE$R>#?ZRcudsmoj5QK>5EAA}Xgus3e#$Am;};5+T1!GRu1G0nmoqVZ%wbzH
z){)^@pm@&=;0{Z0yTE#0rBk)>uj;GC)&@%@F_0SO`BnRY!YcU#r|S!a?7DiHTS-DS
z!{NsnMkDn9Ekh%b47Vg-uCl%@bBzkGT0fFp_t8ld>pFjxcLd<lNOXF1y@&1mP}xT?
z!aXd#|BvQpg6|4&@pj%LPm^J%DE^7C&Z#sMnnJ!EdY(!M4TjbCBq~Ih&Nva8Z3BH9
zFL35Gm+n3JoxgS|=jK}il*|&xZtA@zqaEb0UMBps|BlRR{^^4GKQ-;--}O-cI~4A3
z;nv;%e!R;6{|Emd$*cSG|Ioym|1U1-U+SzRlT0P={vqL&8}(;>%)0BTcBJKZ7%cs_
zpvyA{X-@Nlt5I%jwk@^p`8+YS;nt6qx?eb2y?#_5Gh}~s&iJz27!+Zx#(5p51h<_p
zvS7EV94cg~T)?iO-2Cu`k;AVbvc~bfh8`Mp03AvB+DIDT$l;0LQ8!hX`WLCAGEbKJ
z(-^Fpf#Sk5oT`|=-ru;UpQHTJ=9{uNRRg{mMB?6|rQiUU9i=91Ep;KjNdx|OcPkch
z*3(cv4Y408PkGj;eP>NtA36$b6n*RVchKTc3y!4V`?Mqtnp)1M$){}h<bp&WwjB2|
z+74BZG#;_3H%=$91ERnPMGh#z8=7~3oZICsKF35zJ^HY)g}1HUX{{cjTQxM8+Y+@j
zvMYyqcpAkywi9u`ytT3PGKiP*3>~B9!+=n3si&%qm&tYfC4o8c<CUZJu^ydJyC90e
z^*9{&0B${UN2cMl***OGt~1%Fz6QB!GcpO2fXL8ppG8fx2j$_mdf*+NlX;iv(@yu5
zpQ&g!A9<BMIN9gc+JU5|ZAFO%U8gZQG?J4tRjZcj{V$ECSkbN@&!K`R-g{1~1&S_Q
z3m%1Bm`Nouc%8_h^2yYmx1HZgiW?ZyFGX|;Zf$h0^v#i*XZI$~#Y-dFKa0AgIj_z<
z9hu~wJ3~uzK}vsr0*`^*7!SmL4|t%X9~*|o^n>?Yz7`gu!pPZ=1UchYW%2P+r@tPV
zfg68_dwcFZjUiIf^DJ&Uzc@e}vP1TzF=$NdQ5i5Sf)clu>gZ!F+rAV&hbkH8;X1R=
zKAzh)v&5!}{kV)cY$ObFKqJ9j`q(Ow<KP6gsHEfg5z;-DG<xRjQ&Y8hG!2IOX^Wq|
zkqF4I&6QH@dPdoDQB@~(v}h}vc^(?YDj4pL!E6xuYBbL!b336c%Dp*~;Gd6p!JKx$
z{_O1NR@XmT-~6s<+JAA{G7Wnzv3yP9Xtdxt@7qH^F0X8q6_#k#g*0^=r463`7vyTY
zi6y(C##x6qOnHTEfy~_4`Zj@~DYet<{iJRN`O~1@fU4RhAym3mAiU{mLD%;h{ifmP
znoJ^V?3>lwt|*IY*1+Crq~Ru4A=k!pQSsEz>G;ezG8qWzqDzxeY@WMp5+bi^akE$G
z<<YgdI$n(aQ~Rsv1{>H5Ux8Sqkm{Pk$zwaw<YhUrowJM+6rb9cBz#gtz3~EXgN2;s
zs$ZPJDqA^f1TkK4>SW#|qJ#Dk8x4h%%@O9m`La+%hQmm-9aT!#|6b<DPfZWd`*U?p
zi00WQJK9Glr0hagiu&vQ;j!+@Ju~su@%l;5CVUM?vRI;F!HipGE2|#26!a6%L?(cT
zQSi-X)F6rZk}GuaRjuv!JH7(k4~zX?>({cDKf4KQG*s2~xOW#bybrUfKeciQwL{W^
zQA-<n8fR704eO-79L_iJBu<1t7WE4_^GUDlqHQTt9H7>#oh_F$Mwh;n5dh;$2;qpS
zhTB7FU6Z*=IH&|rNK+26(&jyJ$i&7_zPz_P>;<W)%_p}=%{8m(@kAH}(01>eo}&J1
zBG^6;!ZWqy*s&?i@fA;eZ-6K?LK)5XWYb@kxkl_30hyMs)G8Hg)`;IFZ*=8Z%%d7H
zI0knd(sDY;cWI5|F56;kAnj?ez8ZO8_Uz|sq0))P&*FM>{OHrJbhqP7bqREh1n3n+
zpNRkcX;7V1zHA-UQJ2A*p>ZuE3q(u;No;q*4p|8fw!%D#sFyt7Y~JRo%J!wA>x-=6
zfkvFa(ccZ-?Zp3vifwvz$}I~Xn5o<yrMqY=jGMKXocXA^wWrJo1Ob(z3!Lo?3w!3>
znm9X>vQBfTr<L#GUUlYCLgZ1k06d{MCvaiEDA$XTP&9uT1iojWsxMS}KTIkgf*8*{
zhH#+~cIc<u_y#9LUTsTBnA-D2aQn?m5arFLy+OCu@k|cth@m*hSpsBAHZW1YNYq+*
zdu~1BV2KB1v7;d|LY(<!&@C*C&jEY8H-a5myY0HiFA4PX97{svMiNfFI0;{e2Uiax
z(?iHbYt2FQFEHV+Jh?w-b9A{^2Y4C>)&V!M<hEU+tNEi}zrK^5jO(wp-Ji{SLo=5_
zSmz6^a>$j4vamZ@|KVwY9V+Lve#V!4|Mq%9ksW!crbt_cKyMnBnpc}Vx@2OP&<!G?
z!|(a`Vs|R&A-St&h!-{Q)u#R$Oi=es5ui*!rn*7sJ`H7f!~Jo+bm9>Q)B1aRkYCLQ
z7j_PkaB0lTvtBZ@GY~8s`hvl@7$OxxE%RRXqeP_+W=ww3O2lHAy50lriJ|Ex#r4xh
zG?qxXweAO>5IR}=b`iJ8tA0uE?=KB<48UpP+IA&)@`a+tRJkx{Tc^4JWwG|AOw`=o
zVyEA5f2BA?i<01~1LS5HnojjqN^Adwrm)wgSssC6NSIbV6~mdj9Fa61c`v!N>x@bV
zzvLV?%L7g;^i#<_Xi-+GpquUKOwT-@y3Wdh6%O0@Vs)$=hE$6y>GCJ&(pvSfJx#Xc
zA*22TsKAMuU0afj;#ofN*zV7lwTN!z@eQEGtqA}88b_3}NKQl9kO;RHv*ICN1m&p3
z4NXKr^EvueaxSmp0R7t3!mQ?nnjdbz@-UMn|5Y3ee(Rng@KuQ&ghgp>@Z_QD9fZM;
zTXl)Tb~~;46}3YN9TEIr5^xD@DMcA7j`~T}=k9-QzMWvlBC6@WLACTtRZes2`Dyb}
z)6$XBER4_Og*YJfz)!l2c)@+hDYB8ZxZ29)U5pxd1_U>`S3xCpm%)qmqwUEB7am&j
zO*aG$$$uCdR-m<^d2*M{n-QQ3p&GsSY2%64&jXc}<RFQ~PjPy8=f)MCQm0Gz`EJ<n
z_E4~*eagsL;p#Rb@z$W=)RkD7?ZDfM8G!^P?@kZQ>GymfBtQK=JM2{YjL@HbPXENG
zof7ou)z#J#fJxJj|B9WNQxr}|Wj!*s=Ow@Tl+tOep}8NM;SRrElAXGAzTVC^Vj?Uk
zn)<AKYKo=%bBIBm+9{liE}TGE7~vl$;ZaM~neY4Fej?{GQmu&Xr+GR*xK1L3cjj^^
z<L<dwucs&P5#43NFtI8r`$qc5M@Fp<ZKo%LZ`Dsn`n)ftRUrCo(psk`79p_+X)$hU
zWSjqc`G8q2iyDc*!KTZcIHtmeJ#Z$M(XtkYDO1#=rWcWnJnS>bdsBDDvrAv|+?ll|
zj9mnaUetE&QuzkpM+hj%a~G(Kp|T*|dTa*Z`DgD|n`3&lY3oR^Mj#4UHWZ-YOe;BH
zGz0@?UooAqFT>QFD9x*{dV!o1eLsM4?@UC+AYgNC`FeW2K(BxkfeAO7YQV)I&1eTY
zR?UvaEq9hq#D6&ZC~1Ui(LrWkee_mEO|ZacP0IbGd*SgukSTu4Q-T7TS5}~{pp|G`
z#In=0-nK-~o)9I)YqY|4JxV{3t}1?zR*zf6wnC9Hk(@F>PG9V*I{a=%_sjKaC9z4R
zo8Xm#R8N9C3{|}A;d~c9k9XoBuqo{px1^_?8xzSzmFX_9kFAD!$R!M-^Ov`Zv8b&t
zYQ-mlWn1Iq4Arv`DMN?Aa1Fn!Ha!Jtj>;*_Iw{qULzi|<)16hy)jgySCFWDx*Q;RT
z0XC%Uzk=DfRT>H_5&pQ1W$VL75F^16k3BGYVw5arc;%!1<ygpy2u40ldn9Fb@B2xS
z3PC6ro5utQvMBt-ZUCg*y=Jz(0d|ChzJilIA!@RdF=jz+<_-<n_BVTo)0AX-jk&a*
z77)o$L@n8h_;UGVQYG-f6;89Ufys*I5RmEHS9B4FAEJCFmYCNT6V|A{aLMR-RYF$-
z=nfqmm6@8-ysAcU_Zd1Z-!y4wkzSn;g0`MN<!|&tBy>)FRetAMF@o)J$A$=Ssmr2=
z?&-hVQm|cnfPT5Riuln?<lP&QDmqK#zT32s^M2!c!rb_e%c1_9!Y1hS)3J75m2eXr
zF>Ap)n&$@=qkD0T9xgjIaoQMI*zP5lZv#sHs7S1gW}?JcM6StiILpc^(|0k+!@S7~
z-vy#i;IT0&%K~9XD4RFEAvj`*szKe7@!CJ;r-)2>U6Vv3vb!<T=gN!cQSUp2Df~|M
zc?k$T`%v5MJ^$DJN7~SxmU;;8xiUi&O{D0UZ)W3&_%6I@7imb(Pe&Rls(~@xT+Jtp
z^1+;o>zJQ~zdEX?1oDK>4v)5Qre5^4gGZRagPhA2Hy2m>4%Wdhl}h+UiI;_~qBs3+
z$>%=nNxlhlU$)Xe7>FqPF`uL^<tVlrVQPB2+<tBI*2$`Z($V3&r=kmW#hHeuDYQ@9
z<enq|55Jw(<43{FvWbL=wB#px?uL7@oIahZBig+iEOFbt*(zt|HQ+tfpNrW@0+W5W
z*42T)db_)17OSk%wfi5f)u6V<lM-(zOJw%3J8w%u1Avi-N5I^gm}}lK95J=7(XOGO
zDwN|Xj4X`dyl5iB6tPs=Y=J9>>+%syu6gc6t<b$4C82lmi1N1cEsxHN>XGAebvjn`
zrScDRxVnOfTJb^=GcsD{sj_WNXM94Y2g!n4o&l1p5PUbs*Dw5AF!sF#qY?JCm_Y8{
zTer+kjA!SHL5nj$Z<7wd=<F97=6(Ky%(?59Lgt&|OG4bMrWwz}WM>KJ+8@&MG6WXU
ze6hQphs#LSSI-kOPkFyjVdDDcTW<!Byj(}twjG+qjXtTcwSXQ*2-;>Zxnsp?yHNZ=
z^T<>?nchbFOToICy_yV)Qd;xwf6aN7<_G(%F<v5i1V7oI*>k6cnHUb@Ao=vRjh&7?
z8QuT!lP?%McCvJpM25JEjk%r}2rZvIV7riBXJ;L_9?5LV!xQlF@hl_7zYm7h`tlz=
zLT>#Zn>PFZl-Z_U+idTZM%n;bERf9JuYKnER$rEOvq<L#{yU-%X4DD`Zu<2H`#nvp
zc%&rd05%HR`fq>b|1CCpp?H;>xWOjXn^f(ZM~8$C24QdC?8(|jd|YF)^gsO48ZA2Z
zrr{R(E3xR`^LKkc>M9C-kH{2XsC9MzM$tp9+WcgTrmqaR#xFRc^(M(;WrUxQVM!I^
z{^40d`@mW1D$zYNg14NImVfe;xyso=Z}9TekAl`>BKu#qDQ`UoByuuJ`%apR$K#oe
ztOx5&O(POZVr~mA-%GsHd`858>7X7zKe5ew>z}FYr*=@>0X24*ygafo4j%Y)m{kdU
zjVz0@*NmCpV$^x}2oxmGNWsZARx%en&~F|i^DeKDkx%E{lg;Ok9i6CYyjFs)-VagP
zGar|vr*%<aAKVe~)n4<BH&x0?)k87!QsAAuwy)l){_IxLgFc0oG1;p>^rdd4idSnb
z=E3G>FMblxd0qMAJkY%+^g`MDKD`+EtZXZ=Y*WdywmGD-<y&}tj5G;he(hWS$G^uK
zJ4)IKS^O_9bUy7L61Nt(=r{)a@_)JXw_D(O|7kA~bH{tq{~m@MbDwRmY2+$TzjQwg
zkzm(*a1{BU{+sLx?0>)Q+wK0@GdUM;=>Pr*=Kp3>d{RCZU8e>epjH<?Y1?t=5$Ev#
z*I}es|7V&<fyg17zQflh=oMA@UQ%mV;dxhd)qJb<yfHmWVo^b}BFo+6(DC2tPke}D
zs_(FnZIY_e(RHdJWg(U(6tPxh?(Ins)>uGH#2WO^b$CZ5-K5Lh@`dYBl(QP=5uPK3
zgm<G=s$ivizALan0pqK%=cmj8WL@UvghGnM(t`Kp>2AaJS2jI@kQXp}e|KscKGSbT
zzQ=r+(-gLHXUs{N-RZ~?{wcjgx#(eZ(<UPws~!h|hbSy{$(aKI2>aYxRo|Yz#Xb?^
zeqt4Gd@xtL`^hMh^-{%e>EwLJY(W5wfNO~ednK!rak&!tpto%S8S;1Ko4tEq3)6qD
zet0?}zMTQN^gIFJ#0DfFK|bw@F@cge5fM&jSh(M=HZNwX@?co6P;!8W%YM-YIO^EK
z22(CYJUrm-xC_7ri^b>>;n%f3y~p6$XqHEJ#ZL&>viRh=AfmO_Prl<8oI`0mi!hOd
z>_9fS0PLVGh}36ss(ttBiQLk)Y+TJTGL;dAybDRgA6H4g>cv!MO&!CF)(FXrBhe8+
z=#2f$hc5@LIWtWQ9^8Je<r4|n;XV1uH}WlntJVF7i;-ZlOhZteI*?&8G!Q)6b7iTa
zoisXECvsh|S1CWHY>ZWxAYj<nOxBu_%AP0@t%}aqCoo|dxGC2AzFs{i5v_eIp*!MT
zox`mI7@}VN&?=eWH3~pjE$+2f7cJO2it*k_#}Mdzggg)D)63PWv*JR^4huB`7WRJo
zAvxyB<|;~DuNAyS2D1podrzJYvkPDA&v3T!I(myimo1&^@u*=v+3pze9#)vM0iBGc
zyPZ|6*3EX0<iNz`lzloh^ghPb*pDQfEUYIa7$KZSPM1PruO4$C0G1sniXO%UjPON@
zO>r@kNXb7IyBTimY>)o*K(BDa>sIDeOkfwV!d*dxStI=O{L45rwVRbR8xqRu^zveq
zgqCkdr24tooG;%EyOuVeEW*lfO2S3vdaHq=2$l_#BORoZP><*qRM_wX6xGl6{jT?2
z(%cd;-iK7Pr_szF{Tz8MpYA^)>a(HusF%t<D$;{OR_eB22z#82C%{VFz(sF*$I7SJ
zG<S~gT24ZOqD|&y#pO~bi7ul=lREnYLYyMnqHQB1rlZ=i`lX(a_Fg5jmy~+4F+}dt
znxt3BZh5nXa*Xnr+1GC!5)X1Ze{%!Az+Z$tY@JtxK;&fV1x|Ze=0zUS`C7RT+!uOW
z(Rm>>TmWR&PaoPR5;J3>;_L;pbvD}Utrw7^QH>%w?Zmj5eM)oV&Tm8{4@q_-C>MGj
z&L(F#7C7KIj|0;v?44OQupF|n2VDbom(aGpI2pUiv{1ued015wxhq+uN1`<sU)uX;
zBi+;S6ZXs*_Z<7i7Dqg%o4hdSE-s&yBfkpKM~3t%#!a0>C+kVJkcCVc5s!ht*Q!jS
z);vUVD`rk2=H}t!5g*}4t)BHEltJuh%a(hV^&u)Hmu2@hyb~Q(Kbs7A&B2ZWG}ZIl
zHv4zzV0Q658_~j%=4y#c_5m1C%ue;fVkRmOq^#eJ5ZKEO3o!clbgWMAtgED)_E*h)
zE<G=Wrx0KQh*uQ&sT2%5ketYED+1(c$EfNszU&joz&;L(U16sc8JqH6PbV_9UHSO3
zQeEuVv;D1S%3~-b`<f9g;@D#Rf}*>o{`?@gXdm=0Uu{CAS><&n3Q>2kt_-MkOoF|>
zNvHJOj-gsK%rasu$H|O)kccT!8%`9DQx_7ui+y`?od2}cck{9DVwFXlgp|3LKsx{8
z?2NSxey&Q@sxZwhnzPu<2Z_^?=3<nb$gk^@iAx4oX}d=~SLe$`IAHX`zfO+7Z19Qe
zt!x1B)FXc;n!2%F{jeeE&6k!B${w<|*nQfz*+(pgt?~Cwx*cx-l0X8HVB9**K5g2B
zotaz+#@jdjxi;mDMqazM(byYKac*>V=Z-)JQq0yY>IQPRP-+#g7G#-S$mkDT1+n{<
z_3C(M0yCE!f$Xc@j}n(0cP=8`P<;E$#nV3az4|>$0Ux+6%w0vdSTLufMFucsmcC+S
z+c+tuXJ^4z2b_%HF_hhGMLT%U+6?&vh0-s;?e44;NUCkD^AREBD`eWM3~}>vkU-Y_
zA&t+d_xTHA+{FEuzdJl8GMS$!zHC0*EJRaSH{3#2MS5M)F?9{68-&aZj=A@9c$kI~
z()0qwc7Ox|sgTGw9cSMXOB?F^WmJ_?)%3}jE4vcDpd`%bjH~oD`O-T~0ir%rf|*Ab
zR;-i{&YR5je9wK<Jcq=?%Kcb}pDR9OUs|V2g|B%Yv_gLsP6Hy-U6E#q1vB)1*iy`W
zwq|K7Bjqx}lETHE@m3rZHjeUD1AWZrPFmmxz|QAL7lkM0(+15awHR+uQ3z_HYbo#t
zNICk`cAMeE?|bI_N?b17eY<x%+Mi*r&1n3Z-}9xjE)SZUWejRQ-)!$nGPPSPD`X5}
zM?7bIGi+NPEP7V|%9sMgwBkFPdq=NzmC#pFQaki={PIz{^3gmIVZ-VzbCPiN9BCF-
zXFw<OF#E1^{Oj|^lMi?ob|eJ^EY@3}%ZjDjNH|r`1lbpVpz633JEN3F*S$J5%?Rvm
zu{umCnO0`#37K}At0kx|NR^BzJ=Sxz%$r*ZMf%m}$0H>9;CD63<rsqtlPuhiyRu30
z`U*BRapOS1>bLW<NYF#bpSUK!>FD-}=NoV55YIr4x^pMLN^}aP4Q-cNjoKYet}38d
z05S65ZG3xfM(yi(+oC!!x`CslY+^Ivi_B4n!M4X!IN5cVNN?v*yxhzd(dbkAxLSR4
zXUQW!1$!(Hg;1Oa0xU+?$b3J&UTA-|RVE@P)=J3dUivs!!PcR_Ry`XTJs%wW!;|FB
z@k4nXKP;R&0vmyV$X80e;{Z)za4nr}w$ZjjjLhibS1=8wtU|Ci{guHS6T`HuYYR&1
zRQjx7MmsSY-~}x{$YU1afZSM;?B%uPuh8w=6XAl)4}>>&n=OCO=5SU}D6Wp!YM`Sg
z?HN79CSv#5;vzRH(RDjo|0YS#?<5+pMJLz!Vuk5;#7OJ-bDjr@g^Mio1Ug!U9eU!m
z8`e0fQI_<X{EKRJdG}O_-Gp}qF;wY%i%JH{F{S)%akop<tV3nY{E|F2?R-@6W4Hh(
zR(LA!chInFvYwXE72mWw6#StI^|P5iY3|94(AxATzZJoK)^lGbgX!UVyWiLM&Wh~f
zaMqi=%xN|#jZcn8MYO%u8B*q_2>~gdMBb}Zm*0+S#xL4iKDt$anc&ZB5%RgQZ;4Rp
z{$$=$3;Gv17zscc;q%Uo+YiTz+tje8k0X-n;NyK&XvtM<k&@5%jK7Jq(Tjg-2sQBK
z>CB}>Cd!1;H2pkXN3T}`t2|B=kGoVRDy&|9yk2_z`Az>Y?Z>rIr5<2Kpj6D6J0?k{
zMDXH5#t2bpzzPmUTxRpmF>sSxQh+=h_mX2eqo`6pe}XhF4pj>MFze_t6Q_*FB3io@
z_mib;9SAoxGAv?xf|NFQaIjSA9bg#<{#PD#6m5mXlyni~0c1BuY&YBqm(CXU&W`E=
z-X5~!3(#pAW>o-GxtZPlOPbpIj1A=#&4RXI{h#O?rnepq1UqZxzo+CTz|s4u#R?9c
z7kDZC@*dKD_Bk$rxlU=?M_i>^8UeAn0;RC*n?j6yhfzahqtlj&H^!8yL{lCOe;c;b
zsQrQ}CemI{^BPc3dv#>~t*<0QUDXGkrTeUodWzN2j$TY^_PF2;7rH~4_zUhrdirJa
z3Oor-5lw?b_4>0IG}9x9V}>a~$^;cD(D0pgS}&+y%8`mva{J9Yy>O1G<ss=VO#+Vr
z#;(Yxsn*u~vYkThSt%(j>`-nmkE261oAQLJYMDF0DMNF0yB3s#<s$@U;R5dGi7#U0
zoaPcg658kf+|#l&pv!TI{75PSD0M2M_yJD}p#+pAXM(rRa~C&c-XV|=>zBB8d+I&%
zeViu|?fmW*U8_<WJC{D+d3p}-L_`+T9+&nt>G*Z0Pn(VPA)SS6HYxPpgqGV#yZ$6z
zIQ_PIF`G45q(SXIXu)m$S--645ok>QX2B>g4SP@m-@b-8Os3c(<o!lPEpn3mc9)=k
z-@(sQ!r3_nn54{(MPWNTp7U)pH`Z0=JX!)~kEw%FIIgpE!j>+pwQt}`UdDNlB@1(u
zff&oK)cXOs*k8xY6<E}Y%&Ap`HQ&9;-*HKjD>(8!`4bP2xoPuP3+Rp&VHd?Hwrt2D
z&;I4Hl1JcNWnL;)9O4uSoQd5RQs2#=wOL=Awb}$C0WfPWOf0@IBl3pjB<%!t!p?E_
z&XVM_o>7I%`p=hN<2$3g=B#rcOJF>JBf(ZJ9kogiF~RlmudkO$J`D+fQi6LrZL0Xz
zMdbT^_~}dheoEmB&;+`2wek6xwXhBAOS)G`&Lrd2;c+;BsZl{EH%g!C$J^D4FNyqi
z;G%i=_cs#~4>g6L*ZP;m-*2?5W?I*bdQ?aY;R#&pmgU(9HxEf(w8e=rEI)b;hBF6F
z<*q#3^USEdh^A9|rP26Vz$6L$D6@OUZ7e>#JQ2UZ+k)gtAEO%4j@<s*d)*ryn!a84
zUOe;J51=S|M&1gga>EH&o00(<<g3wUuK-_@>P1zxd7JNf7?_=NR=r4Zua2!3l|*Qm
z-WV<X1tU((oALV$w+yVFy;e0n*4LCt7!l>TXJ(h?mI29-&hQjgDS8R!rp{6VPPf^+
zOOm%~Kn4Eur4iv#ajVr4Qw4(d{+P09pNjmlva$*`-J7PFo?kL0&pH%9r_#-ogeVx9
zE>H}x-84x$YE^U|{N~WwzGOMYellM>-8c+dI-ITtPGa>(^9{DCH}Ni*-Z(9u>tP^V
zFK(W6artg`W|=z;3wGKu{Y<iW3Tk4FsT5h=$X(b1;!OmeBuoSe3tOP2yT~FM@Xy(C
zMD~%y63Hz3qf&U~W$Jdmlw3T8J*Iojr*j3V%NY)D(xHop^f@DdfmKCbiHaFB(YOT{
z-K(NMWh9Uh0@y(=F-T-8jkXNNjMp*@mRX0n^Z~gwaV_eIW;!#y?!#`<Z`SD_<#jE^
z(CLjsj?#o|3+o{Z>vrGE>d%&X?3&8BRL{Mq<d{$Q)*kB(XFINzQB*66jw;N#s7s_f
zoOJ|=@3@9g!#cGZ<%6Kxt8{K6(wioYkMrOl1)?tuQD;-P)W*i^%IX|Lbev;+P4fGa
zs-6?JGNOQ>*Ya8L#h!laHm8Ku^>oSB4ZeNGYBN%fEiyV_Y<C=Z!KwWwdMk%mE9wga
zkyvk2h8e3w)<raKjS?`BUQgMVhqUZ#jM?I+6*$$=?fH>gF~859lhNv8BPyH;Ye4kM
zOG0L)zo5INBzTsa^e~_o_SkMez(2D##y7m*MR#A$l_gfYaXw2Qd^Cbd)1re_Ewen1
z0^q8w?WQAMnao{B{hhvs7+qPg?})@@Zd8Eh>x($IC9z(Cu(-Ft@l<#j{8(fvNiJUL
zFp?RegxSM13i+NUiR&H0cUkQ2T9%tsR#(R+>A~d|(az>x*~ik0o|J{OaN<{q$MkGc
zZ#f0Us%8+}6KHLg=d0Z%<+~ivj9ptg9B&!hosWSFUBOd%(-+q_&}htA`D1805cYEU
z@gr743GKGT&r!3|ZkL@BB;}-mAGkxIlz1?G4052gZPxvcNr${_r-?LM)-#rS7(6xh
z4#(!>jog+^{0O@RB;2QSEwX5ou}rWUwe<F6X^D&a&U5MnY8;VfILBhO?2Mzupa`A)
zj5=h?x91yotV31O&8|H&+{HJlub&8N`_=;aghj`N?THDai0Va+BP*`O@**PUdBac!
z_^kW=L8Hqe8~z54bPVX(L&jXEA<C19a$m8mG%2{WaG!|bN1{E@N!Pi;3^Qj#7wCz_
zN_RNj-jsCX`32qO^7zecPh|qB$u=TT!Xe25pXRSMV$F&@tnyjo>Z8XJ=bHPFJAoTw
zzeui^iy`65!s(ihTWk@cc6C`R^~~?(fDrl=pbj3>PPaHD+E@zXY-stq_gtQNIlNnN
z%cK&qh+SHXKMV8XX#EZ(hdgTj%BR86Zs#fl9+L;`aFsW-6o-C=KE08%auW)8ZtCxs
zIs^l37$4U=H#~<NZy^W5)CaCI=CY_}IH^|DlLfbd?g(4VhOhZH#UM1eD_$&sZqC|A
zUS5i|sy|?<f7a!K_I(fF&+#YVT5^gS!HdL^&;akhJee>_I$e@P)GCWKQEpA@4OC|a
zN24Tn2&nNqwk^^;6J%H>4@(&E-!^n@8;33sb}m2?9+m;d5RlfaV{$8F{WP8L{DRx)
zOP^WFiaj#K39`sW%XR4Kr4}V{$QE#Mc0MGLND7+1reg4DM)(@T3!DEMN)G(`&>25{
z$OjFLs2)n;pSYqTaF>fe=G`l4A0q|z%X+UJBiq@Wmz_WP`vaCKWd8Nt_s-e>eEEMz
z0+<hkVZ;a6dezQBu~LI3bK3GdiPOAouY)1jTjKtV^|Vz}THj`EhwZZOY?ATPM+$z2
z2F8r10!*>mMh_c4YSI4(wHpAGUd|ytaJFF=x29=Yk39EUpsC7#rt9H)gss0M-Oj{L
zzUBJ<3V<abm2D43gnAH;Tg7??xfD-uO~@o92ORjb&zPQha#zK8QQiLyzAZb=>$m^L
z+4(-tIRSZxo6UV@((;MO_Wzb`cjBgW`(y9(y9_3;M51R$F4oPyHjkl~>RaIw>$gwf
zm;a=M7Q+9ega^n~pL6fyYTGMON*N7}?G-DW{2sOtppR+PZu0WrQOmAgI^oM?_1RX^
zTD&E(nrzfO)@~Ig_A{gTaBT5HqoGR^;+PM1+8kR1D*;u2`T^EL)RM64;_SAXxzNv>
z!%YYxiFt)Ip>bdRgPrQ#1YA1j6Yov=OR$)--BDR$RynTp>5K9olWY%Z!aDcB(q}v_
zE0RkU*M+MOkprp&1u9+!F2+q#L`O@b{`nAe*|Zs>LS}?}bM{dgCGtlA`z9VMS(c8g
z7@}se&d+{C-?s$}aO=aR>R3|!Iqz&0kqOx~%@L_X@xUKG3^hK_7SDL+CvxXuS0cOJ
zA+rnzB7LuYKjDm*wpnM1ih7PEFV96MCIWOpX%i(aiS@04T}dx9tzNeDGX|EfR<Q$m
zy@`i(oyETYMhB%dG>I=8$CbGB%4h;61A-S;LkC;!4~8!JaEjZn-8a!hPpCe1pnQwn
z|A|)zVCzrIOVudT)YRDf{m%c11bvG%0>kLo_FC!zbywnC_ROl=OnZ`up%(LNdn$d8
zeDWNk_$3(DZUkRcO&Op#DletB$^;K%#N(+?5q3>iWqCJP3=yIDh~TkCrVLLF^{*f<
z_l1h*a+Kuj_|8-18Y?cJ6#oZnZy6S4x3FP9ih@XE&?O)x-CY9G4I;vTw8T&XLku9@
zB_Tc1N_QjO5<|y;bjQ&B-Q)A@{qFtskM|G9!5=tS+;gwB&UIeb3OcYt%Zxt%x%CL(
zT`1_d&5u*t`d9DqRAk~_Bm7P_?eoX2S+!VRFPc@Uuk6=z>vP%jE=Q}9ss1K9^s5>1
zrk*)~;XMNzd7Y22fN8YgYlu^Wy-4K8r0m8B!e>u6;hH$BYIVL_`a+Q2qUXCu_8fCA
zX>S<7UIkA<O|#MwuX}0>33|Ax08K%!D<V7M>fPnJco*|(sRK41oYXfEL7tLl#YmsV
z|1fIwZ#q~(AWKUe%D8~?PekjTS8BX2;m|d_3SI?4xk7ji?FF6NL<3^A|0D!--8K&_
zS0DLtWBbwcqL5$&P<wsW^)*NnEYNDAg!b8FI{`S`Uib4GQoY^M#ko3eP?w~9wJ_HR
zZ33GrI)KME#Gdzd9e?GH;2!W?7rr5pTBapOV>$Mz9lmGI&{n(;tr164<y4B=<!~GQ
zYkZ;x_CoPesy~1$Ppl*a{ZS1R87HQ)g=gb2Wqh0Zko>OW3}u_0E6fv>S4w9Es5O<K
z_whqJW_zM9??JZv-@tSnXZH@;Z!U6X0quwm=7=_4<GaFC^R9A83V2=#3IB{)VAYTd
z&lWL#lqX=XI4l5+inl-E;;IYY{V_yi@%Y0j-XVXeC)tdHe=Hz*q2EDnr!5+q#1BId
z_a0HU2nZy+b+X+qQEj~38p}(2#7Vg~Mg~4c$mTBP`ZC0D_?x-Aaiw;e$j#J)mx6<6
z4Bpd5c=Chk{8!Lc!`K_XrS4!FUsYNGe-ATRJZ`(V7(K@qT}n6LS`Khcnt0HMRYG>|
zm3H1f5tZP%16(v5EVB;>f_lamEefkPo7|9iIA9Q(KR{-upu1_S%Z<K?8@fz1M6R=@
z@Lh2GcUi#Ym;LBc(%y7yDY(4PLo=qXTCoUNEsb{d>Q5Oy4oK)vI(6|z;D74s`rhHg
zjdeP9+bO(vVDa`cW#OFrY}NNK>}m>ySl27A_rM+6MNHb_$O)p}BA%5n_i)&?O&dD1
z3{zb}b52~%9MUd>iJ>oi^$~jc3aLwYRh}NePX2%J!tYg13IwE}e6dL>)y^JzFe-Ch
z%NY`(*;jTXjQBm&k&$h9)f(tcA^!MtjQ`S(+nD<8QI@)7H!M0%bJaIb)|nig0t1d%
z`u&!y_no|c3q{bqp%u~7gGlDafNbLury<tccRm6FNtA|<Q-th{-5x8xtG1b1T&|*+
zkUom(sx8pGft<iqubc=;ZI&{*mHDP9gm+hllq9RW($NBnF{D;x(>XqKMzY|%d*m@S
z*}S%z^2(x^;kP@zDE=k~8V!OtNW!FVKx*p}+2KP=CzfFFv(JA7d;*?<UR^j5!s*ki
zb?fDFF8SuNbAarIO)}?h5y@$T_aa)e-B()g(vJQ~z5}vi7e?zA4stEcC@IECcDm`+
zmAD&0J@G&(&?s?)<LoZr#$24_{~~0!rC(Kx)Ns`FVo@&IO5sd8{n{h~ph8PMuZpiG
z{|~6p<H3KU!jHSD8rUzJdAxq<tIEC5yIgR88RfZB<V_PjG3;PMc$?UC@AvAI^oT%Z
zz=k)lWd)YGWC(``JX~EYF&gw_<S0;ROg!?NJ7Ncc#dgp_L$0~98wOun*4z?Yu%FOF
zOI7zN{faIpz_;-^M0kH^2))JOi~gCdW;ZK#XlN`4eQG=MNpch&Pv32?@fSoTLr_OA
z^ht-LMgNQ!wu;{%uI~cF>-b3_kkHmS{4>v+IAwUn<8*)+wvQO8K_%*jlctSjG0A?Y
zzf_X0Id`jnv)sDKp!bW$of;iasP|_;*OyQI8_gskdYNp**q@hF*=TkP9&pu|mC9Ra
z$10rI)-uI64?DvAOg5=Yp=4h<Onj~CP9HF0WuxVG=N@(KTVv-^kfIoFj8qPkMy2jD
z2AHq7W>x~RIbM614a1jb70@?x7#V<yz2C;AyW9Xa#PUU9!@K^>tkEY(o<B^>nh!iX
zp?}5gLWEW*@3eNlFX2u-W{6b<uol=Qp+ePR{OEe)iF0;L&RvlOvQG|i3G_cWWJyw%
zIUpbxtIZ|Z5g|i9q0;&r$;lcPWaCca0x!tr;CLdX=LId95k)TZ;~C3=1PVrx*s~0s
ze{kXRea1lI|G|Z7_Fw4aEyb3ip`>O)BiW8z(rYlVXFJtox=XV7fsMupd_v-gjN+A5
z!&MmQ*g-?5SN5-=Qf+2Fx~x&8X=_5pin2}}$#SmJAx;!UuAI)VG;rhZqb^^==`L79
z^SbD*&6omShlHj7h;+IDl7~PL58e5hSH@e<dc()2Dgv|iB~Mqk^hFopuE^eJaNXkf
z933cTNrllRg#0V@ey<A814Rr9Hm=oD5|24xsu8H9=nMNen<z_f-SSs6R4Fy-9q__Q
zRFh2sNI={0t4Y~TCI)`#6WfiREH8BQH$8D2Q+!jPfrI?OKX|+tatpbG>`dsN;o>qq
zX-+|WDmL65(%a?D`jRF}h*{+%g&9#2E4B{c!+?*#Q=gr1(W7|x-FR-Lx5-2nSKQ9#
zBlGQ+JAe0@L<Z)Qj0?+XKFUmjmxJo>hHi}7g(ElU4z@-x)rJ|LJS1n>D^O||iRbyi
zDEQfe-x-|?e6#0z<F5aJPiryw4J{89I{H=H(XS)3Hu!wD<2TQhukBw5qF!=v)QGsc
zx?COwCW1~as0&38zoH~UvTQi>Gq{h{E4Oc2EM|Byv$;L_Z$6Lw!H675MX4b{4Am}E
z$CfE#tbxy0!Uu-c`C6n)e&`Xtk+wZBjTKn_WYYd!yHnL`N@(2??3b^#5SW5EmO<;R
z1YYu3s%`~Xued*;NqCUn7t!mR(Q(8x&$jnY$3Nm@OquCNubi+mwGBdkGrSCdedfa1
zBwG6Ng9@^($Or)PMrL9g%^m!16+z%dkHZS78j|%K5<t8O-T6)fhWJmFna4#$pj%<%
zlALos2{0oIoa|3e|GrzL;d1&0Mk<^~uDARndq~z0AUxD}dRGhXbo-uT3U_@mLUz}A
z-U<}_q}76a7@OI<ZN<u`-Oy_F*9B%akeUX_=s_fH>JuOSkq1^?(FD4+JWG#*N~a=j
zfFt+KXQULGqC0wV^i*1;hKg?<t}=mn74O>^<QMVRShdR&&vn9398shoyR6g-TJ<e<
zZWxD|!_OW5RpYJTlc-f%=$B*{#z0*CAMXcaCBmO1iGb7h2MXt@*_=DlT}TH)B@*pb
z61O~&`QR!#IxpC2n<im!2`@vTD9tnqQwriz7}UAT)gjSkw<f8?&m||DcdKtNS;{<6
z<M@X(=F>$v0#$Wd->Jqo6b-{))~VOrvq)v#e0V9+%y3r{JEygP%+m1cukhk?GY)T|
z>`e^%@v1C8L1dNSV|T0_P(d|0kuoH*{0Z{TLH-|V_MKf#MYW<Mv6He-Q&kSF_qIk|
zzQ5ak10-0B;Sdx~2B%K5!h6?~H^}!6d6Yp^g8OIcbRi%4$q~_yP4#%%oT4)?u&K_u
zKzvqK+h_3{^reljNou;*4nIRVPew2(<<&*7E@?V4SF$#nXskJFSch{r<mbwU82X*{
znVG_pTFmJeZY?{Jvd@+DUJiw+wm(hmsW^`_<9cPu=FzObR2ZS@gg^C@e7cJcpH<$+
z@o4&VZHwz5wLNRkNe!He>R#uF!&W~83Q^RyiVonv5xbCtiZB^(ew_I-Plw@od(@Q1
ztQr~)vkXFqH}gD>Uy+1LUp~yzxas-MK2BZtEPU?VSn+-VnP&}uKXLp@?qvcV%?az!
zDM>Bf;o;9;rv|2&yk~t12;`$GldlA?5pIW%6qyENdL4P&rvFe{(<&$CO)CKWTw+7E
zHsAO*T5Ni6#}{4@16?mP&T~oVR%Lu#cIzD$WJSsji}&yJOKyySVnBUk-TKD^VkcVS
z0mlI;cE|`fQTv}nEgPu)gCcuF;aOF_Nms-XMGxSi)~y#eO`tr`mgavv(@(Rn-Y)W|
zB_AQqF7Lc(2s@s%T<739t#lGKh>D#{QYE0tpyqofI;zOV_VBEzQ%&>Do&<wW@h!5A
zbBUYtinmuSH@yDMi&<1Bzo#un+3BtATr^*xC0nDE)4Zt1+<-dU7sx4vbQp+&uCU<5
zI~inu=`iV@P_Hj4>|u}K(VUx3dQNhr^Bim`Yj%b-aJ{haNx4!1fZ?5UlEFOWd#@KL
z^yvap@w(TMNe;*-+<Lny-%U8J)uthCUA!}%)gZRKsakfco0WFY^cd1sT4<x(1cUk_
znl#MQ+`bJ3t$r<?rEm<!v)*KTW>*sBJ-17olW3+9ov^?onjh$12(I!`Y3qw&2<!1J
z*nBU2Hd{T@N8vaka~mK364Zw-=q7rDqK|}i8lGeH$E2dNdC}}A!RIm4++oj8!tjEg
z{U>}}K*2{Knqpa3DRTmyxxKn_`8h)~gO=_;T*ocLkGmQqlIgWI7JG7^)@WbVvu*bv
zq2|1j?e>@JT&Va>!MU}Y@KXiEt|IRWAZ#2XfKTc$^xoxol=toW*kz11h?%A?r$3^y
z0}p*_f`~H=Y;YLD>ffV$Qp5u|8vCat9*%aVM1%{Xcjr-tI%C2s0+6$LKbr~xy;b$z
zVzg%6auZDHI#{=emG`Ch-Q?g!f6MV<?0Q31qhx+lLg%kv3Wo0S40=1{`Pq4}!+<TP
ze<R3SeimsxHoYUxu}dO_;o8HkA0GYHfWI5`8+x1w@W-_Fz==xEH6m)Sv%Bq<1RGc2
zBr$w+I4P1=Xs_UEXW4>m{sQk#t??Z`R~voN#CbI0guP|wVUMg1BZKOKT1V|jz1@Xl
zi?O3zwsS|sQOKRar@Nb*HW+?~dav=%za9;}FqX#~7DT2kSIJSG9BLYKtn>x=4ttj7
zJ?L02Lo3N+n)`mW=VZd5j7-6b1x>^`;h`^wwOkocbuAXq8ACn}#L+bD8<gE-kM`w|
z&xP?+%b~CGdF*YHg$-^`oVZ8E(03*MUm@hf91%=K&lNupF6)3&RN9Nb7~U2^B917E
zaNfNTzi!RLk~+yG-70Dx4{dM0)CL6-F9dEfb7jWx|G|-&d5w0-gA<9@I~JXH%xX+x
zEQ;w}z@N}eo_p3yPsW36R1XeZNDrpRECP>52T_{JgWl9pKdHWN1H@7K(Sy5Z(D<sA
zT>Obwoy!MJy3R>n`zyAsd5ie&ZEiZ0h+UV0bw`EHqg@!kG|nb|?D>%%v?Zz)E0+L;
zfo^KAkxS#ZrsIhUZ|rim)l(h4)Pv_FPW~L^TU-rjZr#vM;}iKY&EhANTO73CA@%9!
zLjY8L-6g8<H;v@#Y5$G=-!xKd%t9i+>G?+sUFoJ7YnThJe<eH3VZeqH>oJcCikQ5*
z0qX<;S?e_u#uIid*s?5(K5hfm?hN1*?*aPvixwN4Dc2CF31p0qwPB6an>7Mh!l(Qr
z#I<efGI0>jF>0>*TWV=7JP3a-YBcSj%Tw!iI%Dl2JT>C81pz1>@5|Vf{D-4IE~Suf
z<W{*F7dcjWZwB~2Ebsg-|Ag@agLdf;lq4nMV_zv4v2-N;yM-zS?{t@y>MBXU+EQJ5
zwjKz3{)txqov+@I`p<7)Gyiw2`hO=qtME^etJ(CrW`<*hia=`-6e&M>v6j;LLn`=P
z=KqNglE#Sw7;#YK)~yD}9fav_Vf{;l{{J)>vjRQ(K0gEq=L$yr+Ofx;LmtA-<gjn!
zzj-GY>52;=IJ)a^Z2%`oZaGj6VRopN0s}JnUy>tQy8G*0$-nLE0#J1S`6k?8wj-pI
zrOKq#Ju~Mc=0*}qy*+jLD8LnYeOhDC9Zu4TU-i%!cf4ufXD}6mq1Q?DnyY|BS2xH-
z51fAC`ID$w?OGd~cZ0Nxw)~9~Ia0Vj)Gm48k*a}wmWHPU@$uY}GzQ1V<?L}h;ibcO
z@84G}Y?a|^GbavTcfsaxuVyCE<0mUy{V5J5Wh`q)WD%E%IjIGHxtiowCy%7sBVGcH
z%&CqivDT29JSqQDz|os?nlxCC0;Iu0w<-}4FBFrsyXlMHJE2z$)eRuNSTP3S@E;!?
zHfJ1uDrn9n{DS6{-KqU6vZrC;JC9xX70!~eRO<YSF_6h@PD7E#SB6EP6@gG+PF_IF
z`*(_Ue{N&rUm4btwRoaVTAZU_LO<NhEG6`cxG|6(J44Vl@hBck=V%8-j|LA^TDEna
zq?>X(PdW@15J+Uuj%FB&2KdXaJlnd32SS&q2<*XFyeY<0LMrmZL9n|h1Dmta9N%oM
zm-x|FXc~TC(Kwc{C6UqckCIDn+s~b5vYah?DeCP0UliX!m(@T(ba!(GV9M5s>;R@r
zAGDsttwn`nS#M|LfU%QcJt@%;)I56*-E*=VwQGQgGHFMlhVUa(jlxO!^W6e`8dS*9
z)iv821s#il@!L4~l$WtrEVxNmQX&<Oj;t;TL_<o5i$jAbJX=(6Y|}VeZ9P}xKLp$O
zPwhs#w!{M_;7m_mPSjl%m^J960Yz)YCxso!JCo||VdCP4VW3)l@eBEdy7}XnsPm(x
zea}2&7BD?u)2%z$0@^PpzLl|4>Eeu?j~{`X4kD!>H(NQ1wB%@SU1#t<`4M<<97z|A
z0UzQo0qv7bYs``H)<?;dm(}-t1umg(K1#dAh8+?_;*y90>*qy4r9E!hz1(xX;ue8y
z<}{tO;VuJo`q*OT0qGTB9)9EZLP5r6T+ZD}$}KgZ`*{WMQ-Y}WhS=w!4dUyP$lIJP
zQ_I>Im7<f9_k#QGGgi$RZim&gp5A)jDFXt@l*cse;<wBYz{p7jdlm$E@s14uzTh<)
zW7pX6)iJ+-uLHFO{g~ZQ!@`T^e{h~>7u=#bfQQt!nxMzwX%<SNQYq%_@UT=Ba?`Mc
z59d<Z`?Q!(jqTT-#SI-=x${wo-nQ^{;;i2Lf@sUCbU1Hu^PGFK|Go95_Lt}@(Q7;S
zRjoJIyaR{jAlaOlZL;_iF-j^7&4bu3RzvLus*JkC0A)m+^Gv1qQkug6XD8^=kAbh`
zdWixZ`?U5+^ic0(;HGpMMQEqQ?Y{m3k{jRB=O0yYbfw}pC-EB6pR0@-Rz1-$;6fEp
zrU^5>a53C>n1Jm<Zy{V{)MX*DS?fB%Feor?*il}Cx#cJL3oY8b1=%rE={RVs&UhE|
zlc35QVX^lB)trVm67AQvXBY!o(DKk2Z3>Kxl<g_N@n}xC_D^}f#Js4Hg#qzFb|=_Q
z;oS14i1P4RWpXPQ3jaR8{X=^z7a-6^DZEr~Vp`UYRLQ`v`b*T-`6|@KKZx2o-Q$<|
z7xGsy7Z1dZP69xWwsrgegWO39Mt(>l`Vw)Dui`kvm-*_{+3t!q^1wnOT8ogmUYqbX
z!^)XYhH4%DBaEoQ_H?Fy*RhXD40~#f@0R~I%`dMKJxwg|ufW<)41wfY${>$MVDmzC
zeCPqh2E`21ulHQKNIKQfep5biMNE4e-W<bkmFkqHj4`OF&Q=gwT78(EDs49?MNn1P
zP^)e4(_URC=&CQk%CqC-(j@AFOF`;uSE4}2QJ61&o(8m+2>JU=o2i0f$&|?={|iW+
z)SSA5Y#D!8aEtQ93^Eqog&7iMRZ+?{QZSW{1wWk~%7{bx0JlnB`ObI=4WGwhzjKov
z*%Cq4()kV7fl8w@{e?z0YBii|%YLbJu-{1PN{SK&<Y-IbD*0rbBN=;OAQ^U+y50C#
ze`|Ff1Rm`8Lyp+ewyK}4$p!Otpq0o#>za427%N^*r-A9g(&D3Oyn<K?ov>p}b*ztO
zARPKXtn!t-nTYMLD4uojBS4>MykwmT|HJVnU%qZ6_pp54P3~{?M?3qn%-GdV1ez1B
zieT6!9uSFnBgCYnK8W^Mn94O(TyrF17f*N~<FNKyj}mAZrTEp!nZ#q@F||y?WmC4g
zjDNkFLgkSo@kcEWe{0JWxQcA$Lj#-U<G5QEZaUddNdru35HlG#%yf_yBkzZMzTdi<
zI+WPM*J%t@<ntdWH8AXqF5FIlxGkPeIlCcc-z#mJ^nqgM#SiXfJjasrJTn9|j|hc$
z`W6R<jCiJsx>pP2r`fEEg3>wHp`MvX*~>6aGjV+9*6@~B!vw_6AKVU?(;R2uP}4|U
z7+P<uHsNufxK+sUizo)xcFDSHBpHR_K3G)L@TC9*1MO3!Bv$#)B#Q`l&%aE7#`&;e
zmqtSX05Jn@QTy=}&yJfYmsI=epk<u?g!@-rk7Rz}_F4CbqFfFB+(s4OXk~*9h?t`a
zT{Itcv=Wq4X^6B~xx8f^Wq6Gk>uV<cC=~iBs+kg_O3=q)uDtIh%lOo;AHcFle(HP!
zd9AM|UNy$<pARevggY2$YHt0Zs;j^R7c^R8a6Q$1jX-mL&B)S6qU)Su9;HDXxAyB~
z{d}yp)-S}WLZm83a#3vDO}YlyvU%@$F5`fY9Wtk?9d?WNAyMMet`-)Dn!b)_6(WwM
z@1q*CGOeb(^t&QY7P<j7z=`}+iP=@WAGkPbrp{dXP?O5)cYY&qkKqk*`N||QznKEK
zSumH%Ewd#(Cl#gvm4OaFS{_@mdZCKBENjoZ$kUmW`qooO<FP41$l=4jY;_K`=)f2Z
zuDXp)8sK<w(jsFf8>CbGO6oV}q4dIepm?$9E{`|0$sPfyfs&LBjI`^vmZ!WVdiU#j
zi)h(;DZ}+#Mh%UmWo;v%zy8QIT$@i{lcen}N)MT(Pc3@C>_?N8`p-Zk{AbeI<HcyC
zdS;tR?KVL6Y90&+z`pxRV1{rDROLUjTV({mJGAZyWo6)VT|)ffIlJ+Oe%x^2QYM4a
zOl%FX>|GU5xVQd*QtAuEGRabC<ggm<&)MLhqy=@K^EfH7qdR{yz2|{P`oJzmJgk5e
zZBV4R!w+KyH(ab#G`U>rl9*f#RuFE({5<G-T1c_MVn!)TZ7F@(QR{JHXL}<P*Ynun
zXakpFNi@>+ckva(<YNp+^~-awbx~|il-F(PP3mEw$A7T7{cq{7MD|7Y?Ts}X6}B_B
zzdBybi<Ma|8)5&IDJp{!{*srIg)D5%fbsbag;XzBy<oq=VzpQT`fRtJsO~_n!jyY+
z@qXV?^Snod^VOLZC4Nz*+_ggRgwByZs{l#u)~i9r8s_O5RCw+~W_8;GL<bfQko~vV
z$0q_EMx#5^x8w@EE>}kK|C0G4&O>46;a%C}H#S+p8vRqirt-^j{{2ToBHj)%`%Qcn
zD*JJv=UlvgcNQ4uERlk_x|kb3(YY7tDWCE~z9i!k-G4UY;-gxeVQL^!@gr#|%rC?P
zr|XG|%wrma8bG&U)J<!|?P%{K-z8M^V9cUrC)4{j29mxUN?AWaIDf4jj^P~=-)|uk
z2r8%;ka)$L-~MP_8%7Kpdoo*DLIBj+b64thnfl>o+8v4(K}SZkzq{s?0=K*pkQS37
zZMv-`b#D3<DK{`mdUFk~modaQW@_dqK;HCacz>QTWz;i9>Sv{DE!osx6vNrT6lOs5
zBFeoc#dI=6)`(-*P1Kl7x`w`5mNWLr)6DmG3FCG{e!#kcM?tXfzgZe;GRsyT?<(as
zVQx0gVbx6$X(_!&L+5J0?!9~ndjPm#q-YV!*fbYf!B;EyWLa=IndLn{QdAW9RB94r
zn#~D#7o#V%_!Ry2=h?4V<-hIX?Tb5B`&wbA)7A9>AGDMpThy;-il*vSKEjt)3AlS}
z#}VwjoqC@U+_s`tBD2=&a6@^#-qr<*KP-(C7@R%^D91CB{5a2=rWx#&?l{5;zdYsX
zoa<OslO16S76&QI+Scd^T!#gb*~7-(@7|DJ+TME^cb+Ajrg$`?k8lzn_Odn_5~`-}
zZW>v>uH${&s6F_mBIUmxBiOE6lL=VeEZjzIvXJ6~yl1MyjlNEUD7#d5gjF=ins)gK
z#S&oYCD^+KR5!Fs{vl>HzyA=k7M=}&m~By<N71Rx)a`qfqyT|#yIC~6V~kL)eQ7GB
zHL3c{)dz6)hUbwomHB9KLw(uEzLHhLHr5Sj8}bh%YlR-}qP)9$4;qcX`ndk&y(!>c
zt26%*_XY<Tu|FCG?zH{YW1iJfH`y(|=OS`xDL(HBD1VP-FBIA9%ybP_SNU8<>1tM5
z?mT{ixxd{Rce`BSn!ITD<;Z>*AUl!mb?q{H!K3_@e<<;ZLku4Cu62~y)<n_U7}AXS
zIIFPidjRu0n0(X#XnA5$o(#=y0*eU!p|tJg))5|tdj31r3(>=Vka-`t06DuCEq&d@
z5)hWi?Y~w-D(mjWy+Kz<4#7fmG@9p{L@6`YvmaSp-)QZ-ndOYr0vzl-^4PUyd%d*i
zDb>j-Dk7aSo#oL()bs*sdOGk;=4Q#nhZmKTZ`!+9_ddPLSV^L~>A|}tepC{+g?(0T
zvdu{02cfq#bjR0V!;b}x5{gfGBAnBw=_(&O1V>#-U5yo>Z9Uwjt04a)>M<{^dhAvi
z8tSzLa6xBnz3Q!I`>LdYO7K@JGz*27iHRcE;WfZnH)c({K4J-8dM>=+z;b(>w^ZWg
zANa$6C4r3}_!XmD^wlzmT`NXf8M~9n-Z0O16nqU<<2Ppw-QL$GRFUO4W!q8!*5)VK
z$$R}ynX1$^#QTrSNW#N<z9HvD%r`?XUR*bw$6M^3u%O`bcH-E~m}f(qcBBVMJ$RTE
z>lGgWdquRAC#JbjT0=6+6&C8Ukt4iEJnXH#wE*~fkW>BtwDkf#Vn9b!r7+&JDwhc8
z-L3b{WUN)eI#i82GIVjUqQHoe42^Muerdkbp*`17egI8@A*EUgr=1wgNe0pLto}{1
zO%=zn9JG+sCifPI)oEB7%B4RpgYY{nInb%JQJ*(97Jc!9)UIcERf{i>X-lQN=oW><
z%Fr(|S<N`NE7(V&Ogde1WN+k^6<C{A70+|m`WC^HI_J?Jh(q6BLTI%rH=V3xlXnSY
zv{3gcUzKPMG+5@HchGy=l#M3E5UuOTq@8n)jcERWta1;*eYu<kH}8FZl|HRGO^1E^
zb4%_z6aF3Jm1uk)Jza~Qq)JEcPafMqOk0+dP<pj&jEm9g7g6V<X@EC5j7vbZDTOif
zQhCc3ZOPQOJ1F_j|J6sCtjXbNKu-8u_|V-;OdO)mz(2DF$d#oBa%ikfFscP&e`l2b
zY3OmV4LZx98T)$)8e;7rjITeCQ2Ke3A!sl%bTS_JVZ2^a!L5>H((@mpD7R7~7V?AS
zr7mmK8s=w$MJ|gfT}*z~mgVIU*K@?d_hg_K;x^0`c~^sc%!Z0t=~u0}k&%(j<cYpD
zq3YChZzF8(r6VpTC!?tLpY<C~GISWJ|DE0iN)RBtwv+Xr_NJ{%Sgjuf1X@4UVh0?r
z|46Qr7#@%uBtuhIMMTKh^eq8)LL#T_Q$rw~bc1P6$_mIEf)N0R3TIC8?SMBcpsQI5
zpc>$UW6)2B{s&n}0m$k#)z0|OWQW{ZWc}6(kKn(1;(}v*fJiY)!u#{(#k2pu8TEgs
zv@brPy1E(*NUoL-<%zADr`dnjzgdYZJ{sf?(+$9{lK5Y+>HcrB>SW|!=10WOeT8q*
zJ+2*4nR7q(#?tfc4VizX-nWQWxS*HLlY9;z4i$EZ3n_X2@fufc0ji$D<=u=b`<e$p
zkZvP0>DOiUh5?kHRs=cKbDiJJyRvqBvEIDzb$f(bB+eeuQaJ!-9Q`U3C{f$}!*n|6
z6Kn6TCTgyEMe?{K1-n=nYz!MFnt*yT)KiE8EUu`;?v2=$Ud^DP$3<;i3t30SKPgsS
zO81`mr#Y-D$mSB!(<Be%s3Jyo%Ad9nv3-eK5adA871%Scv`nI96*R-}P<ou*M%%L(
z?BxStcY(j<I3&pZVzt0blSzz&;<f8Nino`u3+`T=9Klxa;lbTx--pJd^C<nlVEK>H
z_L)t>Rkm@YFGRg>PJlY6+hOk^sR?(=<S1Ec_KUy`CmrT^C(9cjk&_%sOVheT4@-~a
zmo=@qU;&cIQy%|9cc0zUf5&RQlo;W70zWBEt4c10j=^a^bQ`MW<K}=f;^Mkpe@f(2
zXg)GI-o0uPX$O*8s^F+94U#I*h4@Qcn3cI!aFDMO3bFlooo_g<05njM71=D~uXWCX
z_bJE{+iZ;5X5Tg@08V9P_XuMbvrn3F8?NwEaiELq)TU;wZas8iwAJ1RXu3PJU?zHI
z1R$z9l&!|Hx|NrXq!>g+B1^{PJdaXtg(ok(P!wz*e1kaiB$v-W|F=}<i-M>NuAX0R
ziR_xEgRK5dsO}5Y+lQkBWqWeZbfB6?4EJw&4wbvEK&a5;ggaq(pRnk-)s2P_irFrb
z5>h4M5)uh<*rnJu-VXbaIoms=ElcFxOAGjT3=w$5ni%c=`j0zzIquL0h90-f<-L>I
zf>?^l0!>S)0nv`Q1ypJ*UL=^<L32{G@a#F{n}s(tKu$S~a#+@+qDs!M59XY`<2mO5
zr4CefL)Fe<P^4P#@_dN)v->5yUAXj&0ChN&b57bx`Q4&?s^LUsqqdL`=B~|h)6Zr1
z+Hh`i3*#;b=zelsHGW4+4UB3~D{0cwhwv%hjlG@Y^-V0I%L--nNV04HJetLjr}6&#
zs0pB{>mfI~zybjYj95r35(UD}E^RYzEA;`-^Q<`05rNMJrOVJlMPIMIGR`~Mue~1m
zt-GvxojsF&n);51+U*ng0+=lYaK*$get>v);QO)<Av=KoYIk&b(j3Fu*`%Iz^_Gqd
zPV|fC7spZB{;>rre@l$`lfNB$56QW+opf!P&G5~80gUM%$8PILjqn{CzD5+|(aK++
zFVRrtYvQ_L@f8$@LSN~rvO?6naOo>krMED~G(e<Zf5+-udh{vLuABnq9i$G2&kM*M
z&cX`aOXq(FT^%XbEbI+Q%k<Ye+}iNL^1&ZRnzcep2zFrZ43%DX52SW_@ug0_Kfeq@
zSdj1+>s1dd@EeLJiRwH~Egra~xs@gH>vQ1gD`RM1BbM@ARt=kMIo3GTY)!GQv~8*q
zpB)n+{XG9mAnS~qa#G-MUn}xllbN{zk~y2Fe6;>*n0T0xgM*3xA<;g^aH+kj9{}0H
zp1i6{5WjFHXD=5VIrjwOx|jP(wCi^=kfi3`I2+PMZ9EaRMxkh)izGw4>B`;=8XhtD
z^!egMZtMr*_*ja`O^J<1f6kSDTx>fb{DB){MM>d^y&<x1zoy<kW9ffKkQ}8}c&jml
zBjix5p15o;il96YR)uZB(sh3f<>XhVDvn1rp2#>VGHBVsb_)h`A%~H|*CYw3b}yyN
zrBjJVz@iC=d+Qzh4EbA7AKSEbaWMiO-B%%WTj9x4lkz?sJ?e%?poVVYtLRVH$a9JC
zN(b<sv19vl1+v0`p2Xv$lz6;fLRdpaY`AwsQ6;HO=0Vf82?*JgLG=*eylVJdY8Qsm
zjPPf~CWT?Ari?K6_!`l4v$-TXF(_N-uYI>5@h9G~?z_NFnRM00{pJ&RqXyhy3+}E%
z_5200lJQ@1tEN<oFFm^ZdSDV3Nt<cxQ{*z;nK4};$^z6&o~)0niti4|Tl#OTZ0^KS
zD0Hg`UmVRaQcRFIbl_;+2FZq3>XKICCsbV%{~``vJ8rWt<GppL6@x^HUdQP*b~%6Z
zNb|5e)K$k#H|+*!o2Al-4A3<fa!>A!CvkHrm+^7MG5X)R+dp0$Nw;N=ht}vi>}B?Q
zsV#yjWEn-2(DzB7g&Q=ggHP5MIQ-}P;~K^3(!7^kZ!L+w+EIW$b|yn6hW7!s*s0bo
zS9SS5@?&3})=hp+^A~AHtgQDQ$#j&iMSO3IT<av$ch#PYmIgVM$hA0ln<hHDl_p}8
zn`VMf2Gg(E^(z^j>O+D&l9vAx4&5i8u=wjFy$BcazJ9D9d)gSQj4s}p6o#y#r&^)E
zO+(Y~e^fPTV^tK-Qb8f#pMXQwIIpwKPlCe>q_O=%*as>500EC#Z)V;7#aKEyHq6DP
z>eLMdQ2_-nZE<y~JyAfwXZWsiS{AmuVvl;&(C?L*vNBTKcI1E4l$>%VNYXZaW{cXg
zh(?{K9XP*W<eM5Z3xDwT==$iE{Bc^~nUY*Q!yxydGb9{uFNpIe;=Y4)N4o!^@CC>6
zU(#*q=1FiY4tt*~t~XWf>EUH%q-Un2Lg+8xxRClc2$E|$jLPhk&1ip<EQzGIN^w1S
zrYhaiCVhpq9_+Q5lWzv@*P9QA{O;s82&~K_>>;O+!eIV{h(E3~#4M1L!06WcXk^9A
zWt@u%cihD^<<<JW-rjlIxvF)Tqmv32*nV|p87Zq)rIj@V(JY3JDWFc?<MT8;6s{if
zk&!HI{&;r6R?`S{Qfv{s=z}S?HxJ8AsJ;te*Xohp$L1)tt;P5|rJH%p4m8dg&j0jn
zcg2N<wR3%`9k5}dI+=eI&u)v>GHr8D|9+b>AG!aG^>OEQm&9|%C&<^yg0jh3FZNG!
zX3iC+r6Jp!Z)n*)Tx%ayG5nwhqP^j$kBFsF!;2bMLulO)%S9yM;<cmkOpbjKn$1tY
z0$6}7lN%>aF8ufLS00N<Pz@Nqouplfs<N{v<=wkR2thsf3$vm(-Ew~7e}iYnsp?Rs
zGas7sM_L2jM^tWxoP?tjmPcghKKyLW=Q30bh&c_vAqUOebJ@YjO$^G75^&Xa@$DSR
zYTDgu=Djj{&%c#B4r@hKxj=MM<CXAcB#%R>CZB`PH&p@Ue%}Fo29=$8K)N%`P!$u@
z&L9g=IC&)PnFrKbPI69Q;t4#AO|yKYw|${zqN>G&mSD(1_E=DJeY*$|1V{+~C||Mq
zW_?w86VT}a9NZN7uvgZ+(pfPp3H+<aKPSsJ_|XYhFR6`uUK6*O%yQ`al2A$qOe?dR
zbYJdQzkh~I0PA=R8d1wr@ssv6cwt81)g@E}1?sDAr#bFAWl3CCg!fD3XY0yZ*1if)
z5rHh$mK6Xx#@*ML4Q}IT1H#cj=`;?j$k9L4j<D%*ADqMm8RdtRcG6EdqvqzAI-jv_
zhRMNN6Dp>k^qq56J91>cbwfbJ*wV!qSn%TgA_Ll)u_$#jX{uz$%ta30z4a?4e*06Y
zpcZW)lO{}Do_nYFF*-K_DqPF3$n!)R&)sKW_#R-=fxrKcNmpNEJpLWnYucnaAz48V
z?k9qz5_y|WO;0qUd>9(X9wv~K-OCikxo3{8*Mv=9nT|)4jg|Kt{T{eC)4**T*u9?_
z6Yo_@@?NI$uWkWSCt>J{PP)P_la+BU@n#3#VkZgTYC49}82p{uzGHuin&_hTuu;kf
zT~fEsv)s1gAMuUYm*VE%re0x2o-5JPf-iKeOAdd6>Ec|kVtJd@JS_81D%JDH{(hP3
zNS!d_d5C<PJ6FB?B4o$2#7$ekAW*a+9=BVSVf$45BZ<D~nICY>UXqEfkny0?V)NPd
z>jplXjWlCZO#<7&iromFq5)hadVKQa%h9@{r}fG7Sk-ppqb6i746Qvmv2l2$Ad#P|
zrMR&Q)|%zZ|KxA!zX17Lp7o6t$dRX<ImKTNFxuXngn`h~g5p)7g4V4gdtkJFqN5!)
z;WA1)NgU0r(fu97ElkH_sEldMSw>lWy8|O3?i?%STin>Pl=95uQ6G=#+39LH6sq!i
zj*{b4kT(dFTh~JLqA_-AoesREXE&~<Vh3|Kio{PXT1&lWL)y%+oZ)>s9dH-5MX&hs
z?FV&5+~$oJ-c-N{MttK=NTh@G>7Kq50$#UzOZ^}4aH`VzUig){28F44aH-_nvTBte
z%ezM$oViT__v?giP+eBcwt6Hs<F3)|6ZOdq-k<eI-=MP;_Qgt<t5IlF+mdK?1ZG^s
zR0Ys=IOL{VK<sc(JyT_xv&Q61>aXZ-wJZGWmk^uB2hKVHw8!Tl^VjN|tWAY!feIy+
zrcQEi#8_!nIFG51OtWk&=9T#W5$0Oi)6n3vab3ktw*t3(F#>4E7mY`uEj-U*Cq3Ao
zu;2LEuPw@pL0+R|IZ?NnF9x^#+39!>tyEjzfEq=!xNE#Tw_2n7zYoQ)#KbF{(Ee!F
z0us5nhg$G-%7crcGtvf;)<HknFZw#ny{uYz0^NA}Ncq_T*IBGbwRkrKSB_K7VK$f&
z(?HWCjcKP3rj3W60Hpt)k%Jwo@4-%o?KiBNG;OcmgZ*dXWa)3P#(%s5gyoG|PMpyX
zw(sVCg$(h%OIiB)@U{l<^-;U}bRZvA`t{j;i%aeDR)PqO__(eRrs!S<E=HDTNqrG{
zahu%}dK{n9@}fn4-^Vg3#f@Y7<YNr4bFW%>n{wB!AA0uXBw6bt_V7xaB6Eyr6<=Cb
z`v>WEU}Mzi@KcoY{j#B{BCRT`q4%`|Kd^n<-v|}X%@4MzRg|-E_%Ia>D%QK~3&{Gt
z*30siWajQ(1eNOjxYgMB5sd{#X^!d7tCM^_+<I!i1ca8|4}i9tad3ik&iOzlFU9NT
z#+P%X8>XH;i2`+#H~>B>i15r8)0GCW+B-IylSd{oc?hFVb8YJBI^x(r7@~F9%g2s}
zJ^hV7J?o*mayaOE?97_3qL{G>Y8+fd^yI!n#)9+3r0F3NmV!ZJQH7Tpn7u{rb&?6E
zPot@RNg@@=Y5=lUz&u1N4>Yf!Nv$Nv;Du{c2O7xfyo#r0Z5$7F*2p#gVcLmQXU5$Y
zE~GkU*P6DiF}xV{UZn0}2AOA;Qjt1Lp;v80vRdF)O)?Vg^(#T(W}}#TSCMp(O>M-=
zJP^3DFlL^Xt{T<M*M(@kDDKx0XRaF3Bi?evEMtgJxFq_n3-tG5lJei~F4WiDtS~g&
zuwr-YlApRtbzg{gO*%BG(pn3D4FE!O|1xa8dTkXzC$EX@>U;N{Xh~B@fHF?u6aIu(
z4u6{9tNv2_#qnG(s~&)@v$h_KzD+4s;!Tz@iQ?P4BN!7tVvt_?TYhS`YD{ZD#8RBN
zz5}w?x>V39QA+JsOXfpZmcTahj#B)f@0&>}GZ$f(Y{bhHDwTN)Dt;H_O556xma8;<
za_vR|k=>WCRI3W`MZ7#NiW}w(K<84N{!VG&=1oJ7WAzrM(+Qw$*nU?t&wcp=3QID4
z^Nen;v^VLBa<$It+6NRfn5(85i!}2|`Hy1cWVK%DPkyA1%Q)A&tyyEx&3E?pb89bU
zqUhG|`M>$~ln^F(>{!P>lLYKHgW$Q?e90&P7_ca!m%8o7um^2wmutdcYZ3T7*FY;*
zqg$0Y?D9PhWK$9_9mZ%)V+)s`M@Fy~h&!P8FA5RAKT6_65WKDx&_iuwr7|fi>KM?-
zoiqO()V(bZ6LL8&q2-c&vw$i(y&5*h&OHij1PVll)Z{7g-~FQb^O2Ww{9$OPH>(+L
zZ^$$Uhc92*&)i$e4~(I!0g5|==gK#HW6Z5NdZxu=3A{$QV~Whl+B8m4$?*lhh0#&9
z5FQT(T(9nxc~{rCZ!W3!I{_h{H8wLVi9ZU1(Zi;6^;Q+%jgXl$+EuKlBc7Xp22a?V
zlX?wPoVrM$Mxoa<2oQr=!oMK}R$0);f;_bnWd7^-iPAIch1j3!{HOlBIjSm-s=MJc
ziIomn@vK4fQP)cx4g251+$mn~G`wyp6Zx2uVBi$dk{}CAT|f!wYl?6GcDCY1UhtcH
zI2Y-!C&KW|Wo4THo$G&^5V6?>lpxC9In%OL<^cT@{aZbIE&ldppUvl(MIO|39)Vbw
zBl=>eoHaHh-vakE{VagHLjJ*dQo$nu=KuMv*8h%?7W!Yz@c#|(b=sG$3$E9G?WWq-
znRB;33?-J&Z^n%NkNXt<qnj}Y`qgRe>)vpQXJ_4>-PsIn)YFoQK;Ywf5S~?VwYTje
zcI(D(*7|wrSqu>d$PI=fdvgHdlRQ*_M7Li%{c>nXb^osG^Rd?*#OeHh`aLzRlGDcQ
zANU<p-A=|4k>tDo>P%F;`TV|1HDhn)rOGSA0w9%%#;W~;Q^4hKL#;CJ_HH)~Qb^ue
z6*ODsb?6vT=hljEVlxm)u-HwAjj4$5Tl(PZ>MBjARA?!_)C+3gXZ~+r_)}7sVbV}u
z#}Pjbe*1v#!2^F8AK#?EjH@`hjKXbgOqL&lA6&1ooRK8XigJ%Td6>KJU5gcHbBl^<
z&wo<UP7|s+J{pn}Z@M|n_t=>_58YXecz<-UK2o2fm=*7|)?qOlCcC1@nC*p>#*2rq
z9U1EylH4&T<8bktJQaP@wojZ#T=0^+IB!WYOULsk??y^z5bomP8E5y$ncv;k4i3Md
z)(LDDFrDTDk2hlcOAz_?y$D)mO4!+CNRra`RnT*(m3w;d)iWmk`7suQO+_AQy8)Hr
z*TEvSRN^W#w()hW!2Q?qKUAe@(i>-MWH~NN+rRbdz9+z0ur9IewJwptN{0%)69pR{
z-vr_uK8x^c%+JkwL4kZVbV*Mq*6>pGDl=|_<$~y=xCKq6mtsRPzdK&lWdziFqUEKj
zBgR?v5zrn8y}>v`kY%v4Ig<0@KmH}Qo<@X2Dp)=@Tzt6_XE~rQC)17aa-DzHIun4E
zl{X~F;Et?>zfawj%|g;YU^W`v6L+&e1~Q5DenTdzB4yuwSxM2J?T2t%2;sTW<F;IW
zoWw8Guk6|EL%JdyCbQ(^mxbuW1lA_>)0znYUT4`6yb;~cHk<39clbMqP4rFzWZXUp
zYQQ(BsvR~i{>=|x{T8i@8oiL&{b)d+eJ;AeBXunJMGYd6;9LL-+AWjgaXYr03=HY&
zi{O&-98ggqBgTxun6wv{c9|WVr*gn07vh;I^@MoJSP;(q@*fU9Eg}dP-psZ%a&@gV
zZ~eTns>l|CV4Uawox(qd4;mrfh>jt;QciiEK>%CPYmq2ApXsDzX7*ybliFE-<zEff
z+euU_KPF=$n@h>*zsqm=ZhUf01Y|DSzR`B8qmc+g%CW?o?`|EXuiB0`**y1u2@6lS
z*=aW~UgX^G`f)WHKqOnC5RZkCu`YHXq3`B?McCuFny>)8otUQ;2H3RgsS-?0grwfA
zVtb@IhGGG5sW_|MpAsJ!uDcM1Iq;Jqq5c4lvsMfP_gmvv-dDCn-+pMF9#MG|dU}_<
zcP~i6>8XUj5THF8SeF&q?<mkT2r@lnDXG28j1>WlX!xV?bv3Eg7~XkKVB&3~FKOOt
zQ(*wtsiVhIc+Bulne{y-y7cccxh{b|^Qv(vvi?ygzGOQ5aWe(nrRz)yJFx;<;lL5!
z?lL9Wu8rX@i9$cbx!wS=Sm7yYnOyc&Q1DG^!0;*S7!>ni)6gjR{n50=9^%@$Xeb5!
zSD{O??E~OZi}sZctmUXPA89PHTKrnc6sqK8;$Eui$V?7D9F-usDRAeT=OoEcXElH-
z=E__@FKP9D)1Kj|{Jyu3O|cn2?~c5~!0LExw95K?XMqZ6z58&Qrs=8jd@9<R6(j&s
zwEN(3>osd@_uA*N+q6Eo)1rn!S!^3vV*EZM<FCgD8ggRMTMn06e2lf^T~hPz!Dx9c
z)&|aPR`v#|KCMD+UqcV_)!A(5A?r?vA?vL5FpEJ)ngNe<W1<&$DZa$+-Z1|O>*y*m
z+m|O>PV~TN(i@05iJ~8@KbvV*qpNX7$EMtAJIN8@OVH*RmR^xeQLuO@ou(oI-eds^
zNmQkK8@y;UdbrKEh<jq4rZ{z=(vr`6iaq88&eEnWJl79wg-xG)xRVU_wA~Dff0AnM
zBAO;hb-UiJJ7|b%&1+a#*(r8m*uSLbX;!<U28-^ptk{B{Jv^ozgaYK%3#$qw)jJAS
z`f%dL+jX-<#71{ZCu0ksx{uU+%-vc-{supcrG9&yE-XM44#mE$U>JBhTyH-gsB7c-
zsSu3|M_w~|fm+TCd6qK$zF}IV5`e1Wqn)J}Awdb@k0+YqURpgN8dAN-A$1gR|JN<n
zT!tuyk%T>B@vb94I&@nn0onDqLGnFutJb^ta4T9K1HU843W%XC*at)s<iob>KEPQF
zuizN@{U`*lohadDIG9B<3s-b3K>lSav>t0@;hj|}_7fei%K|KYWyD1)-TwN?e$^;C
zRBx|@-?T_IMY#!p_B;?%c~>B*`-$cgw*yVXyIo`OCQlt}n&@nRxY%B;W4HUl!gW^_
z1PjRId+|%Hj5J;CvAu6FlB|pC{w)k8l^j_`KN-t|9anpKT&<<ddv9)}P)-e$4N-cF
z9C<y#<KpbT=kjzxP)Uw@>=rA&g!N)k?|Pqn>YZ$UlWg4*KMQC;W6`h~)Pk6{jey3f
zSM)YOH<dlDP9+iUGl@*eqI!6GJHVx5m0<bn<8qrvX*ml?{&$h0zaN}kundK)`k_6#
zQBARZ`cAd_zF;JPK3wP2(>22L#%1{*!6hI`2|YYDkSLL*UpQfM5bP9W5T|a4!LpS{
zZ`H;S@Otu!{%{<SP4*Z*b;EPB&M$SeI^56hs)<`Sv1D2qA*Hk`+4>;mmvTVICnbVP
zrf~GYB;!aHW~$N3cG)f|I4^QQT%9CbRftV1w=gE%Yq!b_=*r`HfSyL(c&;@nJCl#g
zB^UIbR=Zu^*RU?;GS+Z~Q)9uVe9Z}*k$Bf?2^K10j{-Icl8k!WaC6NlF<n}q(rHt}
zg(JGp%;LzLLHLx$k}mBfKelRu$h|9OHCap0S2i#=8nqTBU%S6Y8;wz#ozTYZE8j+@
z`Z-b=!xPdpx`gNVDX?wGoFi1^iU^QAJ$FHo0^dB@1?<m%wSvWHPC@yeBYMz^>F3oC
z{M&5=P?U5teEQc4=1_;I(=o4{4B|ww=}@~I4><vx)Hck<MR!7rUt3-!jHegMCP1@{
zxoK4)$Lf<h8r@nm7`WZKV<jL!se4faunt~)X4#tO$ZuhD$=XkoAOA(K!rjPM{Qj%r
zvKj4PZd_lP2fn<=mRV8>6EAW0;`l6ZxnJscWe3Nm;Q_g%3XBA#0NE{as)y5jIw@|a
z(`=R7*N?5>$-IYoeb`%@4puXqmj~?zG`Px>malI^ob&x{>EcE@5GvEAPjRxGlK35y
z(YdGuY~DiJ+Z61@!wZKca(U5rr7XqP4;xR#$!OMquxm#OA7N?@r53HV*NlSHNge4)
zPu9Eo;+-$h_P@UCxFB=kD}fHpSMm&kBqJfYo`1<!gXhfSF%E~zT+&W|6gwWq<yD47
zWTpXJ4l-`-%n^bm2;jI1KN8Bpww+v_D|YaOdDSHLj*4^rlb$T-A&SK5RN%cU%9F{{
zxvj#2ojUPK&DOZ@B)-zx;wQZwcys*Kx;BWe=Xp2LWVWC}*c@)3!`OoZttE$!bNBTG
z{kb|>QbVn-Y`^;zKZGA{Of~E|R=BG*%1XAH)3wPC3S7tJ(p4cJS`gabJ*UEueKut%
z?_$8qmk=IG2Y&A~$VY1>YgzxTE^~72Q}^%SGWDTY3FeP}G4e~tEPE&Y37r|$9~7x<
z>upFk?p8>+-=p<1zG;X|4p?(C9I~dB?+GCIfIymRdQ3m!n|`yFg8{4jE{2ms=~XP7
zFCqn>=Pko@%9?3HJ*4J_!?K*V8NMWBIS&%Brn!Uq+W906@5Xi69+*b8V+QWm<zXG=
zZa7*$g-lxCQc^XR6^*1tsG&w|!n%ZWaWWD3?DqnF1YW~7qP9erp`w^Hr%tR=v;0V=
zFj2jTS2wcl86@(8t$LkabhCQ=v-z)c%xq-rP;X=|Mn4E4nVH+Y%~F;-6NXeZ9Wl}=
zS(nnt##?uOUOe!Dre>ZF>wEc8WG5-}-a@YIRgm&smeIuLt3@HQ>3q}(eVTf=@1F4B
zL#o6O^r}v_!}$wJj{|xBZYB#iS92kT6^^;VdyYu8N%@W!GK6M-Y4xoa4k=3O7R|+!
zr~<KW7SNr*-L>TbTSM(p|C1{wy3GhmQ`j?Ls@FRq0WK7<te^00udPs_S0g%V((#%j
z6Oy-^kUu-4rctrhg`^4j1LJkNGh@X-^s@C4_^C{SzUUY;SRR=_iF>{auGvs8m~Ue<
z36Y`g{cyL+1VR<x8MK%J#dm+k3*$0Yl;ndr8Ke@dRwDY<|9oUH8frrNC9cx<c{<#j
zY_M*>`F!W}X%z)v82V-_^X5u%m}IJxrNsnhu=QE=*SebopJxj;C9yupmhrvk5%5FR
zvbnVP1)W?`?L^RKl##U*&F<}6VVo+%d5Yv>OI)|DxcKVLWbHn^(m-_D&P<0a2P1cn
z(W$CQoh$H@LrL~)S?EMK$szl$jHQ@`m*J9Gw*SeZm8MG^`RUa{BAK@AOnBo7bws7R
z-@2`{*9=+tmXjg!k#gd&xJ{@aI>~}9UL1nD&URM<UdG*nHv4wm{K0woVm=*S3g+;W
zL{4h4KJv*+vZs@Z!hNhPRVx$0?h(%U8DGb3ffBqZY{)F*PP+B9_dhIck{xy!vkyC!
zWI3+fFzsz|$xOJhSs8DpFEDNKC!7H*`CU~A4Yr7TSC7m*#b7&F_*U(QwxqU#9pJNR
zMec@4(v(He`6%mK4xubTxeuXwffRB)|7V~c&s6yJaPZY;^8E>u9fuNPJ|5zymJ>x4
z6&{46%cPAk0f)eFl4Tcv45>X|4j$0kZBL+7ym+|cj39+{rou?=w>)~Tcr4pl&;A@}
zG}!0k;e~%Li+j|j-Q>Y<w$~V*UV&&pz-665C2i|Cz&ZvejY!|lcq}vu*}8$#&&x>L
zlQ`+|LVroIm{u;YFiXqI^d~8VG<TohCOEQjul_u-hxc)ntX{HY`bFvqq)7T+Z~2-Z
zL1;|tNyiN$%{76aE}LNR8wL%q5Q9wSLE>aGXz&13R?n9<mudUjF8Z4FK`*O;U1LbF
z-s_!<(q(_lkzDN`-(unz8VD4S1AS)sA{&o1CVDJR-@d&Vkz*5+!1FYC1S{#mk(wdN
zN}em9u%_8e-j)BlDnpk_D;C+Vh%|f9K;S>+y`iLY;YcxAG1qC{0uz3v4b-|uc+#YQ
ztabvu_-9F$sqOyGd8RcTo4y0e_i+<sd1XFU4wAy$<tJ@Fo6dV*V(&dRGPke}T(0-)
zP<-kC=<O`SqH4RoucCwqh?I1Pqzcj@jUuH80s=}6-61fPbcb|}FoZPHjdaI=fYgw~
z4BZXGyV1-0y|3rf`{jB0#xcjtKK9z@KI6CkYyB6~S7H~7WTK~A(7L+16P=KPGGr2{
zPItc<FgDn`N1#T|KYwODKvDgOE}Z3V>C(xrbsfCS>$30BQqEYxY^5R47GKxb9(**>
zT<5^ZqGaFOA&%jIK45jRu7+IpyRz4g!#_N>MX4UA8FpaN3QmG`^1ZP(8ytS>=7Z&E
zz@>@_`&sLh0U4`%oR*&h=}X__sg~{@uzH>LIZrI8ZB4q&nVz%<bHnjCG-}qH=4xQi
zPD1s-uxF3w?yTU_54D#^aZlhse9EM)Q+E^!f^gZ`S8WtkSJgHTNL<X{rQAI`P9U9|
zk7i7>lboWxIvs*lhmzjOrA+oZ9Danb>J1mD6Ftyh?{mR7^0rhW6+7SFHu^5D66qd(
z&=5!qFJ3GnfgrM{y(^5KGw9<F@|>K{Ra=0+eRGB0C%I~nrwt#n#<eJE;R$tq-0OXB
zota0hn-@|pzMWs|0DS_KFdaZ|V$1{$X_hq8T$Pas=QPwg?yn5MCbpX>8$A(mTj}?j
zUj?8fu`>>}O+B;;Tzdr6uSe5Et&wMLI`S`pE`rkHmaxg@pH&g;<b|>FCIohAbHyxq
zECf>r)Byx8(1uu{P{2y(r9L2a5WyH*j<3`!h~uUnxMJ@KsB`tqgBnx2?Rj40<qGRA
zRaZRK59M?3Vr@saHTAOVZ;>>9G-(OKAaJaDI8<xByZGv83XV))7cT3j9kE2ZJ<4y4
zcd5VsKtIUCyRAaa?XGN`Joe@Xm4FA=b7qxI#*ren*`cC#Gi)!uZMoy}$^72R;Y0%U
z=!TB$Wn-zjfXC7Dm#y~{z;bi$<l<rzA)$Fkg_67zk2P2Dt{UINfe+i5qO*krRs!nq
z+m0bLrNCjU>2f^0_n<O*&YbvdQyP1us=7oqYfOsi?U4cl!0%=B(dldT^E-i$N>)Kt
zgp{D_HMm;=*3`9~h>YS#3Q=gh{cB>39_ee%+oqh_CfOD;JCxhLZ)<9@>TWs!=R{g!
zjmD?;*~gtz?U??8G~%28_ObY1v2VGoud6E#m(WDa&s}m;T=nV86|4+~^B3t+LrAdn
zY$YqYdRXN{^*n{d8D+NBTmcgh)U-m=CSU@R4w!%tDwKp=Tb%4=*KAy_>&weuZePj4
z2qa`U;9e5q(+`0t075`H8hZu4t>rJ!G*+dMp#!mqi#FO!2lVL>>co93ct}0)LU8^w
zE^x3)U%joyqcsY2KT&40$>bmLZ328Mfa_dePNZ98Lw)0I#G9)l0Z_BE@Sn&-!H>AR
zjk{4WwTaS?yGfle9Wm6z>};bD`h6VaYBv%#h(&e3(e7{z_Bj_4F;qn$=-kbjezQrZ
zp8xEu@i?;@sM^r3x6Kfd$51fg_Clti{8vY3Yt0=asVS))){E4xT703$KwIuDa8I%|
z&8yng98^~qbwV=BajRIgJaF*P7=$#?&EYp*?3uPpV##9E*S|5o`RM~e?MB(jbXC@@
zz(gc)#9;-!1Aq=}28(t^nH$wwEKf^~H*H98>@k3Z$oI{8in#3uP|h4P3~wR0a8Ydw
z*~n{Mogp*%+0MBSvsPrP=;Yf%?+YYgfn^T=8A9+1tBcAh_B;Z=-+h@dmnR^ukMH7>
z^kFTHb~YBP#DQvs8~Oq@E3&2Ffw^bA_%jbt79a1Wg&iG8s69CC)3BVvd}U6UKNOx1
znf7sxr=0K~&vi}M*Z2}RQ?{&+z4<yqj@CJ`obqPlRE7E5pU=RbD$oTb6xJdcfnlx3
zRbp1evVe@PP@j&esqkzDJA^%wGisu8<5%JG+bjPHUOBxXNm2Sk>u<B^aoU%1eLA$o
zS{G{tux6WjF7YoBapc8bXQ>W=*d1E!HcaSFm7#E+>Y~SIy4-yY@@m7h4|`aP_e74i
z>eHmgG5l}SOSn#%S!oJ!xvz7PCGRfq)~P@C5!F6NBy2h8MNJ4!ce^jL&hdjUowP{J
zRDabDO2iMQQ(x8HiNE)HCt#yW=QonGz{IDfuzJ@d+GKzWU{2>;T*332h~J<N)<K`#
zcMUYt1RYHBX(;%F`EIY1a@pHwf1f|Az+_+oq>M~JMeA@7p|aPvA9(ld^^t<#ByObn
zyB*Y`RPjxzuo5VceA3>c5O4<xYzJsqc&hg3s_Z@k0X7#hP0kcOmN|ClkPEw83q(4c
z4e8;-xv54Pq8HJb<`}ciR;*P@=XM&S_&(RS6sF85EVR7oIhxY}l3{Zl<B^L$kvh=I
zA~NsdPboZ-OdlfD-VXS+sRa;?<tByEUaYGnnu3qVR~>-ANGZzEZwZ@#84MUdATS9^
z1n7DFLxe+M3J>YO8Uz|;OITifB71!UIv`0j@|nKm5!E#(<Mh?!ZsgOhcFfynV8zX7
zaYFC5G#+<0TYdzf7m#KrA7Ur3fA9Oo<~Q@Q+<o|_Wns)?wH0^P3D6^+|G=2;ctnA_
z_aO=CvOZq>vg$#(V%%0B^JHSv{ntWmG`XpZQh<hT-8Sqi7U25P@3n|?Jl$SCXiu*y
z2L>c`56!&Y4r{x^gw9OKxLpt5lCgZmyhR<<QPQxuHv00E?BzF6x~x<e3az~o(xO6$
zNVrB1SB3aMed;lZ)P4y~(2zukdc+w4#d0exzm<Ik8^7x~kE#l|@<7Xy;FQXstLii7
z<}3K$sLcxjuyO)?l%zPyL%ZUu;ENV0_X=v(?Uk1ojKIVvUu<2TlH8Ze@d@1NM?zfI
zYqY9b_;hJ?maOEnFN0O@dMOFoEjGUD1gR?~%*B`yHg{O;(2jh#tj$(@{{jkG^^Z!`
z3nU|3y6p?28(f}pZs;+K!e4#+GNpAP^0gZIWYFZi8uUHjww5zuz*IOz{Jx>>d53&5
z;8Aghf7w-uCbcA+$G{y>)+yW|DIM@uWc)X%<MlYEBusf3@)y)u_9qGPil;P-S3gLP
zzG%6B(jYZ!3YGuAfG)->?4>b103#5hvBPJ?W#dZ&S$ZDDG6ieMYceMVw0woE=nkHT
z%t-C?*huvep30;@dDAuDoZ1%A!!BUtvr*R-?l70M+3teB_$*2(XcmWl4}m@%=*3A>
ztxq3JCAivODljRT{OFuAYhz;)N)p|$p3tz=r=xOyciAk6dYWBoI;jByg}ae8zAB%V
z{te=eHN)+iPyBI%C0?jaw?x=dO`6`L)cUeoNr8PYC;jr+C4#8ITRr42h+ADYL8yB>
zCU%;=X{@CI;aNztrrODY$26oy@O+Te+U7HwKq1r!lhxwlshUiivo)(yn`f8ccQEu8
z$V%iGG<1`1xoTzhD?Llva;&(?6LkyhcXHST;+FtpGgS>r=@chdIo_(Tx3yYLFM6`L
z0|@SXVX}zt{T3%9-Fpo`PDPi;gCECiYIf3ph1SzJggIDqzH$T{E!uYcvx7VPd-uLc
z6F7a0!2v4HrFvzH_{>)w)F#(w9CT~SV#!1qU8xOJ&rhSB+8R||{bKj!qAF=@_yJT(
zN}($uaI1%_kS1RP!m_F)M39ZLSBwEB=V*B$gA&3m|A;1`ca}LLAi(FYeDkH0Xm>jm
z)-N?Mvef;vYCW%dQ`NFBXt&wn#5XzPhyoEZR|wvGY8+CZusu=Y;;aLmGx}+{SFFDl
zT#_t~EXwr=cH3Cgc%7GKw(Q_HUJul{GNCL@o1frZ8S@CA^iqO%TW<QHf!0TNi&%9e
zffwS}{8&!!f@>B-8&oL~Q_AR!dUW8|30^=4lq*2V2TEAdUYs3(W813gU6US#mn)(0
zBw2a{&wsVgGa0>436VIA#WkBLdQD5BlD7{D4IfS{Q>G$i)ib(FL}@wgg`?&?Sblpr
z=iob*dL^?DAB8nj(ZPioqght?uH?)^jKZWtJVHvGC6{|-y!elqEctxzc0LY#xSEOK
zJlrjb+NW^sRZ_=HGGu#`RHos2R5=kJ-p={e0#i;v5A4{bkn+~2A4c!^RRj4oUYv|1
zJvyN9A}mFqzQF`SM4OIl$-}p^&%=?ihy4f{PG=zow_JlEIr*TT*0*DHoNCANRra}&
z8N|BQa(bK5(V9Z7g9eW%hg*JBNfMwOe^St^_+EISf*5;;0x$x%sV-KC3|s<w6UcEd
zOv=eEaj*j?ZGl$VYM3VjmO6WWpv82dsXQo+6u{)hPk`Y8cVpL<F5jHxJhUdQ7rRCx
z7`jNbGQi_B1srV9_qZS)Ui&F*YZE+9RcgRV2zW=-Bx|1qlj$yxn`F+j36p3iFVxu~
zdf!tJ?zb<g8TE4Oxd@xIr;&Q;t)8iN{~>bXA9g;F-7;gI2-*_-_?g29eQ-d{s_eLs
zW7G7gOWvm}yptu}<A|R=B%QO{Q+iw4a~|l_X0-58eKk$T+O7*=Ep-?}9C)v%lFb3C
zX4~2ER<l;H$9+p6TvAL-8EfOA$H_wR{Xp>&7<O&2<1oi^SowcAo(IKBcxsMMKNdcv
z2K;{MgE3&KtO0Q%WVKHZzauk!WH71t+ai!#1Kn0ZqGj>>@EG8&V9q$BddablgfrBR
z6$j>z<%V-2$4psk5ipu(nN%>JC3q0Vbby+x$tOPC@|2N{!3IRim>w?*D=IMUIS|{*
zlQNV;!J+y=#IQ4qjnw+AYP}e4+*x>l1n&cn6^gAVILBeqX%-_?*}(o^q}9%7zTwBd
zJXA3ovj<Z^<s0z}ELj5=r+cM_+jV^d&iPp=SMP*4!khcO_9u+u;>L(nzMfg4JJFaE
zJVyK@KQ48^RPS-C0)Ku@b8-HNS_z&(UX!;L6Qb`%3mLXifm9mrc4}^!>CkAqHIR<a
zYYYE)3?34LhBHGMdMGE}mk%f;6P`5yOb_d!8|nuBhp=z}T)kGK414t;x5Rxtfh$zP
zs$*P8)15<s%Y$3E!JHWABlq%<VW@+}f0>c7uEAp<XR!>hIgsO0r=dqQ5LV>V5CBXM
zKO^bTfiY?(e?q!)?F~8s^m}IEHAm>Pg|o|}=V@&i%wrqEfGOm^ksVGrk2)mWWIeAt
zP-C(l_13hJ67U;iRBVRrfaG2)+vdYOSvJl7!F8?^UtCAjA{c4?43xjfkrzJ~-aw;&
z;jqTWc?T5JU@*oqmNdhaq7B!$;b`-h)+xGA%?(HQG&~QYaq%o3*LbC5ZqV}M*|dd_
za9^ltCg2uGX17^Tn<><&OdIjwRuzx))2;tOXx)g@M?d(>)WV06Bt>oGuP4fx?l0YT
z0~!aAKhoe2!ll;Q?;zW%Zvi?La5BcmQFMtO)Q%-)3>?_=qJ5sWxirs25pYUoi(V{U
z>_c1XHx>tZR5rXm3=h9$clq=7XObL#x@LR%Js8QrjC{9;>lM%)W3&(<$`is_&1YUI
zU%9Li?$!sp*?hT4D#l)^^UIg>yD5{_#-J#I!<{P)Sn}K!726IbO{>yF;G=Br0v2Lg
zMR2_D(-uAv&=mU1PChnPvj~rW^Sce~F10Cje&V@UuG$Puy(oa+z5KAw$wB^5>xF~c
zlhC^gxE*)g<IErA{>uLB|Maz)uh7qX{33qKD8eD6Ath;yr?w|$&r8s6I5*wu^n$0z
zBlm|^n=vD)*scS{6+)ctz*!&A&1skP<9X=8sG?lUM);|#Ukc&o%;ju9XOv!wO0~i|
za&x<~Vh{%uHjbaHuRgFpRt-3@c2{B&+Bk0J5%?S?$}H&_7F$XqYSn8EpyEDP8-)Uu
z7f{&YC!6m4p-RA!VCa1U=yHaVsoJ)dP(|#}tjJ!EV3V!7@RW=}fI}d_qokTD8sF^)
zr~9-^w1-hmliE9)pJgKZ@g*CTj==IHwS+qcGW7={=VM9naeI73!gJ{L_ITN}G(d=Q
zB=xk?R)%)=fp&65^R|d)AajS+{t<G=*f9Aa7F<})%Cz4UoVWAs9-#v1eU>;%CVjQL
zmhWZTda&<>Z01^os78M8Z+vb0t>)3YLRwJZAyZb@vro*EA1t~PpIC#O>6U3O!~)sg
zso$F6AaQ>x@y?;Y)0wY-1E*u<^ARWUJ2?g)!90a-i>;v%x)N81JBqhk*r`X(Jlg_L
z-Rs2;NFOO9_{Tnp^d!D|0DT;LM_26BB4?gGm*%ruQ$Ox6ykp$?v-^{@%2vx3bjsnx
zPrL*rrePArrOI+?e;Z2~vNgzP*c)AfRaMygjf55v10#$#&d}+0@pwTH&9%!sVFq=7
z-(?dghY6%OP>(Ce1M9wk1D0*PVG2u@hnSS}=Z7IJ+j3=vlD{7f8<3EOAAW)x!9d@b
zBQ?f`0Mm!VK0HG{MUT4~hz3#*N$bO9eXd%BZbbiztVYAb0RG4mL42OErLYeI*ISAL
zaBal8ma{>5(J-|Rn%KM~ny3BEfXTKZfT;aC$?}JaMn;|K+9Rw;v^Hirht!m=%Es$a
zG`qVxmE>aden*ty3+EeeJmuCvTS-+zdU73CL7^8ZZ$hdcTmu&uCnsG>uj1Zx;H>XF
zaJA=8HY4|D^A@F`XSGTAbZTTLuH=TGXG4l{`G)?L{mbuWhvqJuzm_6hCg`$;&}W)1
z*6mp@l)DRgAp5xzwGQ={8=yhM?#d$;A0O$!x@{^B@sl42Sar5kOOwQGwiN%~ysvIu
zDywcYBWW`CP^*a}U$;nHtizktTJh69{i=F=dDWq&bGbHPP24T>3;V<J8UU8}<cvSv
z`R<igvp9v<THY3~g=F)mBdy~}I<HSG>HdyAZ8xO@WGob2yDQNwNnqO7y+n7P$@w9k
z?Rp-bt#47lKi~9BpY+irrS>&uW;6_ZEy@XHymCgZPL}md&Rx+ox=iS9QTT#Zv~ytg
zUi}etjT0pePn#Gng)k$jR>N?O_I4px8+*(LuF?n%f=z9B*;7O(r7q1`$>B5I=a_u}
zU*ZhC-Y1tmC-|f*+Q<2Y#HQ$klV`TmjTz&?sePgzbDF67&xV$O5HC11vJ+IztPWYv
zh;vg_N?5Jg$%hT32*~R<pBHn0y4l0uIw0i?fyUq{c?`^&q`MjfCw{$*S*d{!v>^fG
zONUVjVCj7V^B(BiLkGZF<kEhBx+?07Pf@5uRzFH-{K8k;zOS4L)^b)d0&@I-UW!Z*
zIan6sr>X0->2b%VAAs-TREm`MCb-Mmyj$d3{DG0iB^T&4yV#MmQQ0^oHsQn;EpdWq
zuf|);_;#e7eu(SWPL??o{__o6zNi#VrD1uDe3KDSq9-c<?6U9o**7C=jK}O6Ea1BX
z1C8p!M$gM*@<nHp>T*}>>)C_JFDi8oX2iAB8~?B%5>YFohXNZa&xoa#BYRW4GuLjO
z-@iak+sv}P)Thj|Vqr&azR2w^Dv5K56M$i7X?9%qYdam$woTki_B5gVZs%Mu^%K4(
z*<~HU<##_*Jh5t!4Vo$^b)c(0=nquC!lgydMr6rkA!6uHI@Ngq^!iKj00ap7|6wNK
zrKvelxr@xFx~QL%T>?n8>DWvy48Y+_<%>UXxr2@bPnS($eLP(tz-fg2+PK;SFs>Gh
zo|yv5fB698>hIS+$W7R&BAVMnf)uXZ^st&QDiO}<e2>IOj|KM#yn+T#krL3Q?OImx
zH`IGe-oTHt0PeIzGL1$`ng<@j84bZx3Iu2TF*fcDwUz&cN1<TCVSvjeW}6E-d!oA}
zgt73tl7=K`FAt8Up<CY#mpIDG7cY;Y&mdkjMLKnS+Cm^@aFtl1{Zcqd+FQ0*gc@)*
z>jLc?ZUe>-oPo>H&Jx{0`xk>^%nL3?JvPot&n7c*uc?=ik~pn1B5t=NbJDMy47rx)
zb*`gj@;)*>M~y@LaoYEj;hP5|T~u{ufwUzZB>7&M4^K8*P;L03L)K!DpFC@L^`5;-
z0v#aP@;_mzNY2^}RHC0QaRMBx+4OG{za<cEwUfcJh3pT8Vun+ZbGdF-nzoFp$QOv8
zGEq4ERD*qYnbUQ_ve|6)hm9griNpYK#Xab3Fga~ge}Bj@1_q>CqC^+TDLY&&ChEZZ
zk=f;-u4Zc=DSIH9ly{8Ny_KkA<5afn8EgpXz7mX6{P4x<hP`&?QGI0kj#!Yc^iP>O
z&TPqwT&JxIn);i<B-fZ~PZvEXvgOw6R8~$1lzt9gYoq>3$vRyt7TXA_VM_RG1kbzZ
z3edp@Wq`+{oLaNzZndMc`1}n`kfh3Lxv5x;4)EN9O$;w@Jf60hkD|BkxX~QE!T{Kr
zg9%lQ#8B8>u<l=kd%Ks%@;v(XFAn7L7|;Gnx+vGE9<e*nf=ex9nL*n3C?(+jj;YXr
zlv$*l&%KK!U-#{BugOKL>?m-xbs7hs8C^Y3x+_ca)h|Qiq$c~-Y->QO1cO%FVG`0(
zyO{(xIxhIb3OR~xf2+cN@SBBp5;5o}>gF>^aQ1XAD+aY;9SI_c$)rrd?*%L)#Zv!=
z9PByyuG5#ccQhh;<tPXnjh1kZAR~-xP1Y#IQ9ERX{?F(np`CGvq&&&+;GZU_CvX;9
zc}NC)_FuP4s3(k~;P3Yj7+_Gqh)m}a`<S07QAuIBmPl=;Sa>5hj4NfK)R?p9B+Ptu
zPv<F@&QXWgJ+w3hdW2^2rL#e^=e8Kx(=z1Jy{Z_W>XSIlMP8l70|;~~R%m25cOpBR
zx)lJT10+;bBEWpkAzm*g2!=N-1e{FA4_*Wy`eu<WP`TRsiEnQ^9(aK0AzzfCQOIYm
zwoUO(L7RXZX)<`6OKY)pTfo|p9&jl*vmT_KZ}yhXi`fv2T#7Dx@>{`GgAQJNQd&PP
zM8BH2bvbuM4Vk4WXx4}q{$3!C{^bF80_1HWD~$g{q@wR0)p-@fs-x7T<<|d*25dxN
z&XJx{Ye_ZlnZ5r~7U=3SZOKmy$B~7g?qu;~f-7;fXP`Il#%k$>@rj;$Ek4)8QX#qB
zuq4cncQB}A>ZL**{Z50l%QP1t(o9$UQV|@AoHKbec)nd9#fNuJ-BAHH6vB7EXX|xD
z^<yJq8IB>Ss=!)HY}pT!um2SDfo_jBmB*}^6<3*!Q_=4&#B)t*vGZN_s7>Dido;q;
zXWzBEh$v6K3B^X^VsglNK$Ua<!CchqN$+eNWK0}FEs$odm5E4MV%9%4RNIW{P=%Px
zL28k>(9epYTZiqH&4t?=KH8olU`CWFXz3I|U!jL4QNIZLxk-zpuNMP`uciR3j)1ys
z*FYN_?-<^Zzr(A5J^FQj=-_dD+BJuFvHn$K$IWNC+B?Ob4v19RaHIp{*Kr^z`~ynT
ziVtF}*)|%Nb5|vrcTeA_)ZUlJ3c-Oc8hfA}sDXlc>#Qh2PGu9PdB4+LyRNt^#UKNR
zbY^e<#t5;mBk{K%uqv~lefRwv&A?q6jitmmtc0g#clseyAp9rA(pVd%YJ<bbXM3?J
z-@*op+sOOGrOHbht2Tc2-KzWexF9Ua0QEJRUlBVADvf$Rq7}!abR}b_C2A4>#iBBT
zbI`N6Wi@PYH_7b{FRo7DpWMz^DbGSTK()%}N;lWOGs<}WGY2YN&w+kzx3D@D0Tyw@
zkRdJK6*0(QbD&TL(1`wWx{*@ydz|4PPal+<KL!VhaG@JU4l~LJU|xaLGsic5vFh(D
z;L6^f<}m5PAxe!7umf!f+GXMjc<d_)i3`K3BzM}&hu|#jYVqop4&yg?9pJSHQWw!@
zPWd8<lfLDhbA~xI-E-HZE!~INZ0zCB(Iv+p5ip?lA^*lb4?QTMJ<;k{O~86|QonIi
z;qf_kBc;aDrcXC`zVsskuaqNN7P$4Dw4N7iSEwKf+|l^c2$5ALvXF7Qe_n!n_YEY5
z2|irOOj;Mo{(162*H4}igVC>1Au-%{^p@?~hi`nhOemx92g%`6?S;vIaDn-9H+eau
zr5B9}$X1<VmP4c($UPtXeO{#773t!a_C2pY5v(D#B*>El{2YGM>W|E-;JpCfA*%k3
zn~Q}4HlMb7faVPN;wjYU=ZlsXD=8<V8t|HxWK;%Y#IHfZ`@dNM55F%y*5kBL02MqP
z8~x#~lG;>Us9(j2t{|DF<v1OefS8}LhJ>fcR=Jkzq$jtVd;~<l6`~^FElzA*tWU(x
zYg8*R{~75IRYy2B;A8v90$#lvfCqdm&#jPeSkwr?y$m9A<u40B-{Drd=fVwEtKW%~
z*+imkU-8)!q+TEG$&ENG4fs`(9oiF*ciOm(;={R++SkefzC!50C6VS{X}FI-;k$)a
zS|_L4QawwrM9yI|kTC5ab^0{F2>&Nf6Q6m@odo9WYXIW(3od!ciL+dZ9xk8rEM}-G
zlYEcrPUdN{ox>AFR~;0_@P3O2mM&j>)h%)b1>vSmJk{=T6V@rrb-!-C|J==2D|FW>
zvi>c0=HWl1RqcAT##UwBS!xqb3!nNC&v)Ty$1sUzbKUg$vU2d0F|?vzdeUo{j*Ml&
zMY!ED%<5o>${aJrQrdp}^@w+Qb!qhVAsehbxL3CQ@XL5Kf&a;c@_8XS@1lNHM^62D
ziLDCbfvc>;a{-j-Nn%8KDm_Qe9NJW1kUlk}XVUpc=hl3){{XA{mCW~3cD?lV^*e6z
zvq92NR-fm<{gy}G!rn7gAIaDg6?q>eTQQpM%dSWN-iNVe(j2&U5vD2g^O*!c?5j>Z
z3S(UTRln^_Eh`)?=ve0craed1r3;_#=;b2_2M$Hz>6cf>KY-+=&5BXa=eY%DZuotW
zqAA#Nj=|(vH1}!>W1v6-bDHoteGYHL5=#=T%^bL#ciA?plr>fiH%05*UFJJ+R0Qu%
zJvHY5)X*x5hx4+m<`aI?m(EsXdT7bit!9TrBCMoIp+3-hg~Rro&9D2^uCq=Ei;Gr`
zRiTUUa(W;P+fRhv#_(Vn2W)FZYzzbe`MiRXx-0UdIrFp6SP*6Gvk1}XP59Nm1b5SN
zlT22d(*-}W>3p$#`T?*T`^5=J1%Uy-aR+O~@#y2)V?kDvX3wp1Q}I7r6OGcj3NvfU
zTYCL575=jO|B93HeI15?QNIYfh%CImg!-gAHt(I@f{g`9Bc0fN)XMg1Pu`X_ya)>i
z+p%laRoU^K=NtKh7MdLmf<v9I%xpl07+g9J<m))8mxNP=0r5E*Ao0DU2XZwws3LsK
z5o~5}{btc_>3!-eR+VYC#PwfZ0ZEiIP{g4@iLXlfzC?T$A(@S;9ex8AjcuA6ttaxa
z{Ec5gq=Yx;`+h`N+l($%AivTjzk07{4NqMK;`A7ZQwa|)hYJe#EW9B`vCF&zv_mTT
zr6f-AfQNhzA8^k}eI+Pco4_XptW=anmdY+|dN-}pG$6*i7Oj`$M46|*^WrSpEh8~B
zAElx0fSfycC`99*4UEix^57(LD|RvSJE};npw7%az}IcKIvP9;__|%Mbc|7YB)C0{
z)QC{;|D10Aw&uwv61`S1{5{Axk^*H!fB(Uze;xhbA7(LhMgM8%bNy`v*$Bq}d=ESN
s-=#Yw|5i2pZ*;Hzf4?AcChF?uJ0TkW_Y}o}H-NtvvdS{WQXfA59}BFoegFUf

literal 0
HcmV?d00001

diff --git a/src/External/Directory.Build.props b/src/External/Directory.Build.props
deleted file mode 100644
index 4536bdf..0000000
--- a/src/External/Directory.Build.props
+++ /dev/null
@@ -1,8 +0,0 @@
-<Project>
-  <PropertyGroup>
-    <ImplicitUsings>enable</ImplicitUsings>
-    <Nullable>disable</Nullable>
-    <LangVersion>latest</LangVersion>
-    <IsPackable>false</IsPackable>
-  </PropertyGroup>
-</Project>
diff --git a/src/External/RawIntrinsics/AVX.ManuallyAdded.cs b/src/External/RawIntrinsics/AVX.ManuallyAdded.cs
deleted file mode 100644
index 0a7ee43..0000000
--- a/src/External/RawIntrinsics/AVX.ManuallyAdded.cs
+++ /dev/null
@@ -1,25 +0,0 @@
-﻿using System.Runtime.Intrinsics;
-
-namespace RawIntrinsics
-{
-	public static partial class AVX
-	{
-		/// <summary>
-		/// Return vector of type __m256d with all elements set to zero.
-		/// </summary>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_setzero_pd() => System.Runtime.Intrinsics.Vector256<double>.Zero;
-		
-		/// <summary>
-		/// Return vector of type __m256 with all elements set to zero.
-		/// </summary>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_setzero_ps() => System.Runtime.Intrinsics.Vector256<float>.Zero;
-		
-		/// <summary>
-		/// Return vector of type __m256i with all elements set to zero.
-		/// </summary>
-		/// <returns><c>__m256i dst {M256}</c></returns>
-		public static __m256i _mm256_setzero_si256() => System.Runtime.Intrinsics.Vector256<byte>.Zero;
-	}
-}
\ No newline at end of file
diff --git a/src/External/RawIntrinsics/AVX.cs b/src/External/RawIntrinsics/AVX.cs
deleted file mode 100644
index c10c3d8..0000000
--- a/src/External/RawIntrinsics/AVX.cs
+++ /dev/null
@@ -1,1336 +0,0 @@
-namespace RawIntrinsics
-{
-	public static unsafe partial class AVX
-	{
-		/// <summary>
-		/// Broadcast a single-precision (32-bit) floating-point element from memory to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VBROADCASTSS xmm, m32</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_broadcast_ss(float* mem_addr) => System.Runtime.Intrinsics.X86.Avx.BroadcastScalarToVector128(mem_addr);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" based on the comparison operand specified by "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCMPPD xmm, xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmp_pd(__m128d a, __m128d b, int imm8) => System.Runtime.Intrinsics.X86.Avx.Compare(a.FP64, b.FP64, (System.Runtime.Intrinsics.X86.FloatComparisonMode)imm8);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" based on the comparison operand specified by "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCMPPS xmm, xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmp_ps(__m128 a, __m128 b, int imm8) => System.Runtime.Intrinsics.X86.Avx.Compare(a.FP32, b.FP32, (System.Runtime.Intrinsics.X86.FloatComparisonMode)imm8);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" based on the comparison operand specified by "imm8", store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>VCMPSD xmm, xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmp_sd(__m128d a, __m128d b, int imm8) => System.Runtime.Intrinsics.X86.Avx.CompareScalar(a.FP64, b.FP64, (System.Runtime.Intrinsics.X86.FloatComparisonMode)imm8);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" based on the comparison operand specified by "imm8", store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>VCMPSS xmm, xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmp_ss(__m128 a, __m128 b, int imm8) => System.Runtime.Intrinsics.X86.Avx.CompareScalar(a.FP32, b.FP32, (System.Runtime.Intrinsics.X86.FloatComparisonMode)imm8);
-
-		/// <summary>
-		/// Load packed double-precision (64-bit) floating-point elements from memory into "dst" using "mask" (elements are zeroed out when the high bit of the corresponding element is not set).
-		/// </summary>
-		/// <remarks><c>VMASKMOVPD xmm, xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_maskload_pd(double* mem_addr, __m128i mask) => System.Runtime.Intrinsics.X86.Avx.MaskLoad(mem_addr, mask.FP64);
-
-		/// <summary>
-		/// Load packed single-precision (32-bit) floating-point elements from memory into "dst" using "mask" (elements are zeroed out when the high bit of the corresponding element is not set).
-		/// </summary>
-		/// <remarks><c>VMASKMOVPS xmm, xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_maskload_ps(float* mem_addr, __m128i mask) => System.Runtime.Intrinsics.X86.Avx.MaskLoad(mem_addr, mask.FP32);
-
-		/// <summary>
-		/// Store packed double-precision (64-bit) floating-point elements from "a" into memory using "mask".
-		/// </summary>
-		/// <remarks><c>VMASKMOVPD m128, xmm, xmm</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_maskstore_pd(double* mem_addr, __m128i mask, __m128d a) => System.Runtime.Intrinsics.X86.Avx.MaskStore(mem_addr, mask.FP64, a.FP64);
-
-		/// <summary>
-		/// Store packed single-precision (32-bit) floating-point elements from "a" into memory using "mask".
-		/// </summary>
-		/// <remarks><c>VMASKMOVPS m128, xmm, xmm</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_maskstore_ps(float* mem_addr, __m128i mask, __m128 a) => System.Runtime.Intrinsics.X86.Avx.MaskStore(mem_addr, mask.FP32, a.FP32);
-
-		/// <summary>
-		/// Shuffle double-precision (64-bit) floating-point elements in "a" using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERMILPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_permute_pd(__m128d a, int imm8) => System.Runtime.Intrinsics.X86.Avx.Permute(a.FP64, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle single-precision (32-bit) floating-point elements in "a" using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERMILPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_permute_ps(__m128 a, int imm8) => System.Runtime.Intrinsics.X86.Avx.Permute(a.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle double-precision (64-bit) floating-point elements in "a" using the control in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERMILPD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_permutevar_pd(__m128d a, __m128i b) => System.Runtime.Intrinsics.X86.Avx.PermuteVar(a.FP64, b.SI64);
-
-		/// <summary>
-		/// Shuffle single-precision (32-bit) floating-point elements in "a" using the control in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERMILPS xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_permutevar_ps(__m128 a, __m128i b) => System.Runtime.Intrinsics.X86.Avx.PermuteVar(a.FP32, b.SI32);
-
-		/// <summary>
-		/// Compute the bitwise AND of 128 bits (representing double-precision (64-bit) floating-point elements) in "a" and "b", producing an intermediate 128-bit value, and set "ZF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return the "CF" value.
-		/// </summary>
-		/// <remarks><c>VTESTPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm_testc_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Avx.TestC(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise AND of 128 bits (representing single-precision (32-bit) floating-point elements) in "a" and "b", producing an intermediate 128-bit value, and set "ZF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return the "CF" value.
-		/// </summary>
-		/// <remarks><c>VTESTPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm_testc_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Avx.TestC(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise AND of 128 bits (representing double-precision (64-bit) floating-point elements) in "a" and "b", producing an intermediate 128-bit value, and set "ZF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return 1 if both the "ZF" and "CF" values are zero, otherwise return 0.
-		/// </summary>
-		/// <remarks><c>VTESTPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm_testnzc_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Avx.TestNotZAndNotC(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise AND of 128 bits (representing single-precision (32-bit) floating-point elements) in "a" and "b", producing an intermediate 128-bit value, and set "ZF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return 1 if both the "ZF" and "CF" values are zero, otherwise return 0.
-		/// </summary>
-		/// <remarks><c>VTESTPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm_testnzc_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Avx.TestNotZAndNotC(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise AND of 128 bits (representing double-precision (64-bit) floating-point elements) in "a" and "b", producing an intermediate 128-bit value, and set "ZF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return the "ZF" value.
-		/// </summary>
-		/// <remarks><c>VTESTPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm_testz_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Avx.TestZ(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise AND of 128 bits (representing single-precision (32-bit) floating-point elements) in "a" and "b", producing an intermediate 128-bit value, and set "ZF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return the "ZF" value.
-		/// </summary>
-		/// <remarks><c>VTESTPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm_testz_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Avx.TestZ(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Add packed double-precision (64-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VADDPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_add_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.Add(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Add packed single-precision (32-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VADDPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_add_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.Add(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Alternatively add and subtract packed double-precision (64-bit) floating-point elements in "a" to/from packed elements in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VADDSUBPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_addsub_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.AddSubtract(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Alternatively add and subtract packed single-precision (32-bit) floating-point elements in "a" to/from packed elements in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VADDSUBPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_addsub_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.AddSubtract(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise AND of packed double-precision (64-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VANDPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_and_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.And(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise AND of packed single-precision (32-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VANDPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_and_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.And(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise NOT of packed double-precision (64-bit) floating-point elements in "a" and then AND with "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VANDNPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_andnot_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.AndNot(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise NOT of packed single-precision (32-bit) floating-point elements in "a" and then AND with "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VANDNPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_andnot_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.AndNot(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Blend packed double-precision (64-bit) floating-point elements from "a" and "b" using control mask "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VBLENDPD ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_blend_pd(__m256d a, __m256d b, int imm8) => System.Runtime.Intrinsics.X86.Avx.Blend(a.FP64, b.FP64, (byte)imm8);
-
-		/// <summary>
-		/// Blend packed single-precision (32-bit) floating-point elements from "a" and "b" using control mask "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VBLENDPS ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_blend_ps(__m256 a, __m256 b, int imm8) => System.Runtime.Intrinsics.X86.Avx.Blend(a.FP32, b.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Blend packed double-precision (64-bit) floating-point elements from "a" and "b" using "mask", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VBLENDVPD ymm, ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <param name="mask"><c>__m256d {MASK}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_blendv_pd(__m256d a, __m256d b, __m256d mask) => System.Runtime.Intrinsics.X86.Avx.BlendVariable(a.FP64, b.FP64, mask.FP64);
-
-		/// <summary>
-		/// Blend packed single-precision (32-bit) floating-point elements from "a" and "b" using "mask", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VBLENDVPS ymm, ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="mask"><c>__m256 {MASK}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_blendv_ps(__m256 a, __m256 b, __m256 mask) => System.Runtime.Intrinsics.X86.Avx.BlendVariable(a.FP32, b.FP32, mask.FP32);
-
-		/// <summary>
-		/// Broadcast 128 bits from memory (composed of 2 packed double-precision (64-bit) floating-point elements) to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VBROADCASTF128 ymm, m128</c></remarks>
-		/// <param name="mem_addr"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_broadcast_pd(__m128d* mem_addr) => System.Runtime.Intrinsics.X86.Avx.BroadcastVector128ToVector256((double*)mem_addr);
-
-		/// <summary>
-		/// Broadcast 128 bits from memory (composed of 4 packed single-precision (32-bit) floating-point elements) to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VBROADCASTF128 ymm, m128</c></remarks>
-		/// <param name="mem_addr"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_broadcast_ps(__m128* mem_addr) => System.Runtime.Intrinsics.X86.Avx.BroadcastVector128ToVector256((float*)mem_addr);
-
-		/// <summary>
-		/// Broadcast a double-precision (64-bit) floating-point element from memory to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VBROADCASTSD ymm, m64</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_broadcast_sd(double* mem_addr) => System.Runtime.Intrinsics.X86.Avx.BroadcastScalarToVector256(mem_addr);
-
-		/// <summary>
-		/// Broadcast a single-precision (32-bit) floating-point element from memory to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VBROADCASTSS ymm, m32</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_broadcast_ss(float* mem_addr) => System.Runtime.Intrinsics.X86.Avx.BroadcastScalarToVector256(mem_addr);
-
-		/// <summary>
-		/// Round the packed double-precision (64-bit) floating-point elements in "a" up to an integer value, and store the results as packed double-precision floating-point elements in "dst".
-		/// </summary>
-		/// <remarks><c>VROUNDPD ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_ceil_pd(__m256d a) => System.Runtime.Intrinsics.X86.Avx.Ceiling(a.FP64);
-
-		/// <summary>
-		/// Round the packed single-precision (32-bit) floating-point elements in "a" up to an integer value, and store the results as packed single-precision floating-point elements in "dst".
-		/// </summary>
-		/// <remarks><c>VROUNDPS ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_ceil_ps(__m256 a) => System.Runtime.Intrinsics.X86.Avx.Ceiling(a.FP32);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" based on the comparison operand specified by "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCMPPD ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_cmp_pd(__m256d a, __m256d b, int imm8) => System.Runtime.Intrinsics.X86.Avx.Compare(a.FP64, b.FP64, (System.Runtime.Intrinsics.X86.FloatComparisonMode)imm8);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" based on the comparison operand specified by "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCMPPS ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_cmp_ps(__m256 a, __m256 b, int imm8) => System.Runtime.Intrinsics.X86.Avx.Compare(a.FP32, b.FP32, (System.Runtime.Intrinsics.X86.FloatComparisonMode)imm8);
-
-		/// <summary>
-		/// Convert packed signed 32-bit integers in "a" to packed double-precision (64-bit) floating-point elements, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCVTDQ2PD ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_cvtepi32_pd(__m128i a) => System.Runtime.Intrinsics.X86.Avx.ConvertToVector256Double(a.SI32);
-
-		/// <summary>
-		/// Convert packed signed 32-bit integers in "a" to packed single-precision (32-bit) floating-point elements, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCVTDQ2PS ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_cvtepi32_ps(__m256i a) => System.Runtime.Intrinsics.X86.Avx.ConvertToVector256Single(a.SI32);
-
-		/// <summary>
-		/// Convert packed double-precision (64-bit) floating-point elements in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCVTPD2DQ xmm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm256_cvtpd_epi32(__m256d a) => System.Runtime.Intrinsics.X86.Avx.ConvertToVector128Int32(a.FP64);
-
-		/// <summary>
-		/// Convert packed double-precision (64-bit) floating-point elements in "a" to packed single-precision (32-bit) floating-point elements, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCVTPD2PS xmm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm256_cvtpd_ps(__m256d a) => System.Runtime.Intrinsics.X86.Avx.ConvertToVector128Single(a.FP64);
-
-		/// <summary>
-		/// Convert packed single-precision (32-bit) floating-point elements in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCVTPS2DQ ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_cvtps_epi32(__m256 a) => System.Runtime.Intrinsics.X86.Avx.ConvertToVector256Int32(a.FP32);
-
-		/// <summary>
-		/// Convert packed single-precision (32-bit) floating-point elements in "a" to packed double-precision (64-bit) floating-point elements, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCVTPS2PD ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_cvtps_pd(__m128 a) => System.Runtime.Intrinsics.X86.Avx.ConvertToVector256Double(a.FP32);
-
-		/// <summary>
-		/// Copy the lower 32-bit integer in "a" to "dst".
-		/// </summary>
-		/// <remarks><c>VMOVD r32, xmm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm256_cvtsi256_si32(__m256i a) => (int)System.Runtime.Intrinsics.X86.Avx2.ConvertToUInt32(a.UI32);
-
-		/// <summary>
-		/// Convert packed double-precision (64-bit) floating-point elements in "a" to packed 32-bit integers with truncation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCVTTPD2DQ xmm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm256_cvttpd_epi32(__m256d a) => System.Runtime.Intrinsics.X86.Avx.ConvertToVector128Int32WithTruncation(a.FP64);
-
-		/// <summary>
-		/// Convert packed single-precision (32-bit) floating-point elements in "a" to packed 32-bit integers with truncation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VCVTTPS2DQ ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_cvttps_epi32(__m256 a) => System.Runtime.Intrinsics.X86.Avx.ConvertToVector256Int32WithTruncation(a.FP32);
-
-		/// <summary>
-		/// Divide packed double-precision (64-bit) floating-point elements in "a" by packed elements in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VDIVPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_div_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.Divide(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Divide packed single-precision (32-bit) floating-point elements in "a" by packed elements in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VDIVPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_div_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.Divide(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Conditionally multiply the packed single-precision (32-bit) floating-point elements in "a" and "b" using the high 4 bits in "imm8", sum the four products, and conditionally store the sum in "dst" using the low 4 bits of "imm8".
-		/// </summary>
-		/// <remarks><c>VDPPS ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_dp_ps(__m256 a, __m256 b, int imm8) => System.Runtime.Intrinsics.X86.Avx.DotProduct(a.FP32, b.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Extract 128 bits (composed of 2 packed double-precision (64-bit) floating-point elements) from "a", selected with "imm8", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>VEXTRACTF128 xmm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm256_extractf128_pd(__m256d a, int imm8) => System.Runtime.Intrinsics.X86.Avx.ExtractVector128(a.FP64, (byte)imm8);
-
-		/// <summary>
-		/// Extract 128 bits (composed of 4 packed single-precision (32-bit) floating-point elements) from "a", selected with "imm8", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>VEXTRACTF128 xmm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm256_extractf128_ps(__m256 a, int imm8) => System.Runtime.Intrinsics.X86.Avx.ExtractVector128(a.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Extract 128 bits (composed of integer data) from "a", selected with "imm8", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>VEXTRACTF128 xmm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {M128}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm256_extractf128_si256(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx.ExtractVector128(a.UI8, (byte)imm8);
-
-		/// <summary>
-		/// Round the packed double-precision (64-bit) floating-point elements in "a" down to an integer value, and store the results as packed double-precision floating-point elements in "dst".
-		/// </summary>
-		/// <remarks><c>VROUNDPD ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_floor_pd(__m256d a) => System.Runtime.Intrinsics.X86.Avx.Floor(a.FP64);
-
-		/// <summary>
-		/// Round the packed single-precision (32-bit) floating-point elements in "a" down to an integer value, and store the results as packed single-precision floating-point elements in "dst".
-		/// </summary>
-		/// <remarks><c>VROUNDPS ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_floor_ps(__m256 a) => System.Runtime.Intrinsics.X86.Avx.Floor(a.FP32);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of double-precision (64-bit) floating-point elements in "a" and "b", and pack the results in "dst".
-		/// </summary>
-		/// <remarks><c>VHADDPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_hadd_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.HorizontalAdd(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of single-precision (32-bit) floating-point elements in "a" and "b", and pack the results in "dst".
-		/// </summary>
-		/// <remarks><c>VHADDPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_hadd_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.HorizontalAdd(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Horizontally subtract adjacent pairs of double-precision (64-bit) floating-point elements in "a" and "b", and pack the results in "dst".
-		/// </summary>
-		/// <remarks><c>VHSUBPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_hsub_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.HorizontalSubtract(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of single-precision (32-bit) floating-point elements in "a" and "b", and pack the results in "dst".
-		/// </summary>
-		/// <remarks><c>VHSUBPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_hsub_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.HorizontalSubtract(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Copy "a" to "dst", then insert 128 bits (composed of 2 packed double-precision (64-bit) floating-point elements) from "b" into "dst" at the location specified by "imm8".
-		/// </summary>
-		/// <remarks><c>VINSERTF128 ymm, ymm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_insertf128_pd(__m256d a, __m128d b, int imm8) => System.Runtime.Intrinsics.X86.Avx.InsertVector128(a.FP64, b.FP64, (byte)imm8);
-
-		/// <summary>
-		/// Copy "a" to "dst", then insert 128 bits (composed of 4 packed single-precision (32-bit) floating-point elements) from "b" into "dst" at the location specified by "imm8".
-		/// </summary>
-		/// <remarks><c>VINSERTF128 ymm, ymm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_insertf128_ps(__m256 a, __m128 b, int imm8) => System.Runtime.Intrinsics.X86.Avx.InsertVector128(a.FP32, b.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Copy "a" to "dst", then insert 128 bits from "b" into "dst" at the location specified by "imm8".
-		/// </summary>
-		/// <remarks><c>VINSERTF128 ymm, ymm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <param name="b"><c>__m128i {M128}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {M128}</c></returns>
-		public static __m256i _mm256_insertf128_si256(__m256i a, __m128i b, int imm8) => System.Runtime.Intrinsics.X86.Avx.InsertVector128(a.UI8, b.UI8, (byte)imm8);
-
-		/// <summary>
-		/// Load 256-bits of integer data from unaligned memory into "dst". This intrinsic may perform better than "_mm256_loadu_si256" when the data crosses a cache line boundary.
-		/// </summary>
-		/// <remarks><c>VLDDQU ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>__m256i {M256}</c></param>
-		/// <returns><c>__m256i dst {M256}</c></returns>
-		public static __m256i _mm256_lddqu_si256(__m256i* mem_addr) => System.Runtime.Intrinsics.X86.Avx.LoadDquVector256((sbyte*)mem_addr);
-
-		/// <summary>
-		/// Load 256-bits (composed of 4 packed double-precision (64-bit) floating-point elements) from memory into "dst".	"mem_addr" must be aligned on a 32-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>VMOVAPD ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_load_pd(double* mem_addr) => System.Runtime.Intrinsics.X86.Avx.LoadAlignedVector256(mem_addr);
-
-		/// <summary>
-		/// Load 256-bits (composed of 8 packed single-precision (32-bit) floating-point elements) from memory into "dst".	"mem_addr" must be aligned on a 32-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>VMOVAPS ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_load_ps(float* mem_addr) => System.Runtime.Intrinsics.X86.Avx.LoadAlignedVector256(mem_addr);
-
-		/// <summary>
-		/// Load 256-bits of integer data from memory into "dst".	"mem_addr" must be aligned on a 32-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>VMOVDQA ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>__m256i {M256}</c></param>
-		/// <returns><c>__m256i dst {M256}</c></returns>
-		public static __m256i _mm256_load_si256(__m256i* mem_addr) => System.Runtime.Intrinsics.X86.Avx.LoadAlignedVector256((sbyte*)mem_addr);
-
-		/// <summary>
-		/// Load 256-bits (composed of 4 packed double-precision (64-bit) floating-point elements) from memory into "dst".	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>VMOVUPD ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_loadu_pd(double* mem_addr) => System.Runtime.Intrinsics.X86.Avx.LoadVector256(mem_addr);
-
-		/// <summary>
-		/// Load 256-bits (composed of 8 packed single-precision (32-bit) floating-point elements) from memory into "dst".	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>VMOVUPS ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_loadu_ps(float* mem_addr) => System.Runtime.Intrinsics.X86.Avx.LoadVector256(mem_addr);
-
-		/// <summary>
-		/// Load 256-bits of integer data from memory into "dst".	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>VMOVDQU ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>__m256i {M256}</c></param>
-		/// <returns><c>__m256i dst {M256}</c></returns>
-		public static __m256i _mm256_loadu_si256(__m256i* mem_addr) => System.Runtime.Intrinsics.X86.Avx.LoadVector256((sbyte*)mem_addr);
-
-		/// <summary>
-		/// Load packed double-precision (64-bit) floating-point elements from memory into "dst" using "mask" (elements are zeroed out when the high bit of the corresponding element is not set).
-		/// </summary>
-		/// <remarks><c>VMASKMOVPD ymm, ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_maskload_pd(double* mem_addr, __m256i mask) => System.Runtime.Intrinsics.X86.Avx.MaskLoad(mem_addr, mask.FP64);
-
-		/// <summary>
-		/// Load packed single-precision (32-bit) floating-point elements from memory into "dst" using "mask" (elements are zeroed out when the high bit of the corresponding element is not set).
-		/// </summary>
-		/// <remarks><c>VMASKMOVPS ymm, ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_maskload_ps(float* mem_addr, __m256i mask) => System.Runtime.Intrinsics.X86.Avx.MaskLoad(mem_addr, mask.FP32);
-
-		/// <summary>
-		/// Store packed double-precision (64-bit) floating-point elements from "a" into memory using "mask".
-		/// </summary>
-		/// <remarks><c>VMASKMOVPD m256, ymm, ymm</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_maskstore_pd(double* mem_addr, __m256i mask, __m256d a) => System.Runtime.Intrinsics.X86.Avx.MaskStore(mem_addr, mask.FP64, a.FP64);
-
-		/// <summary>
-		/// Store packed single-precision (32-bit) floating-point elements from "a" into memory using "mask".
-		/// </summary>
-		/// <remarks><c>VMASKMOVPS m256, ymm, ymm</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_maskstore_ps(float* mem_addr, __m256i mask, __m256 a) => System.Runtime.Intrinsics.X86.Avx.MaskStore(mem_addr, mask.FP32, a.FP32);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>VMAXPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_max_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.Max(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>VMAXPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_max_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.Max(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>VMINPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_min_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.Min(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>VMINPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_min_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.Min(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Duplicate even-indexed double-precision (64-bit) floating-point elements from "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VMOVDDUP ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_movedup_pd(__m256d a) => System.Runtime.Intrinsics.X86.Avx.DuplicateEvenIndexed(a.FP64);
-
-		/// <summary>
-		/// Duplicate odd-indexed single-precision (32-bit) floating-point elements from "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VMOVSHDUP ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_movehdup_ps(__m256 a) => System.Runtime.Intrinsics.X86.Avx.DuplicateOddIndexed(a.FP32);
-
-		/// <summary>
-		/// Duplicate even-indexed single-precision (32-bit) floating-point elements from "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VMOVSLDUP ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_moveldup_ps(__m256 a) => System.Runtime.Intrinsics.X86.Avx.DuplicateEvenIndexed(a.FP32);
-
-		/// <summary>
-		/// Set each bit of mask "dst" based on the most significant bit of the corresponding packed double-precision (64-bit) floating-point element in "a".
-		/// </summary>
-		/// <remarks><c>VMOVMSKPD r32, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm256_movemask_pd(__m256d a) => System.Runtime.Intrinsics.X86.Avx.MoveMask(a.FP64);
-
-		/// <summary>
-		/// Set each bit of mask "dst" based on the most significant bit of the corresponding packed single-precision (32-bit) floating-point element in "a".
-		/// </summary>
-		/// <remarks><c>VMOVMSKPS r32, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm256_movemask_ps(__m256 a) => System.Runtime.Intrinsics.X86.Avx.MoveMask(a.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VMULPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_mul_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.Multiply(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VMULPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_mul_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.Multiply(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise OR of packed double-precision (64-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VORPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_or_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.Or(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise OR of packed single-precision (32-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VORPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_or_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.Or(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Shuffle double-precision (64-bit) floating-point elements in "a" within 128-bit lanes using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERMILPD ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_permute_pd(__m256d a, int imm8) => System.Runtime.Intrinsics.X86.Avx.Permute(a.FP64, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle single-precision (32-bit) floating-point elements in "a" within 128-bit lanes using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERMILPS ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_permute_ps(__m256 a, int imm8) => System.Runtime.Intrinsics.X86.Avx.Permute(a.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle 128-bits (composed of 2 packed double-precision (64-bit) floating-point elements) selected by "imm8" from "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERM2F128 ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_permute2f128_pd(__m256d a, __m256d b, int imm8) => System.Runtime.Intrinsics.X86.Avx.Permute2x128(a.FP64, b.FP64, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle 128-bits (composed of 4 packed single-precision (32-bit) floating-point elements) selected by "imm8" from "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERM2F128 ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_permute2f128_ps(__m256 a, __m256 b, int imm8) => System.Runtime.Intrinsics.X86.Avx.Permute2x128(a.FP32, b.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle 128-bits (composed of integer data) selected by "imm8" from "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERM2F128 ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <param name="b"><c>__m256i {M256}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {M256}</c></returns>
-		public static __m256i _mm256_permute2f128_si256(__m256i a, __m256i b, int imm8) => System.Runtime.Intrinsics.X86.Avx.Permute2x128(a.UI8, b.UI8, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle double-precision (64-bit) floating-point elements in "a" within 128-bit lanes using the control in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERMILPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256i {UI64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_permutevar_pd(__m256d a, __m256i b) => System.Runtime.Intrinsics.X86.Avx.PermuteVar(a.FP64, b.SI64);
-
-		/// <summary>
-		/// Shuffle single-precision (32-bit) floating-point elements in "a" within 128-bit lanes using the control in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERMILPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_permutevar_ps(__m256 a, __m256i b) => System.Runtime.Intrinsics.X86.Avx.PermuteVar(a.FP32, b.SI32);
-
-		/// <summary>
-		/// Compute the approximate reciprocal of packed single-precision (32-bit) floating-point elements in "a", and store the results in "dst". The maximum relative error for this approximation is less than 1.5*2^-12.
-		/// </summary>
-		/// <remarks><c>VRCPPS ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_rcp_ps(__m256 a) => System.Runtime.Intrinsics.X86.Avx.Reciprocal(a.FP32);
-
-		/// <summary>
-		/// Round the packed double-precision (64-bit) floating-point elements in "a" using the "rounding" parameter, and store the results as packed double-precision floating-point elements in "dst".	[round_note]
-		/// </summary>
-		/// <remarks><c>VROUNDPD ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="rounding"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_round_pd(__m256d a, int rounding) => System.Runtime.Intrinsics.X86.Avx.RoundCurrentDirection(a.FP64);
-
-		/// <summary>
-		/// Round the packed single-precision (32-bit) floating-point elements in "a" using the "rounding" parameter, and store the results as packed single-precision floating-point elements in "dst".	[round_note]
-		/// </summary>
-		/// <remarks><c>VROUNDPS ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="rounding"><c>int {IMM}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_round_ps(__m256 a, int rounding) => System.Runtime.Intrinsics.X86.Avx.RoundCurrentDirection(a.FP32);
-
-		/// <summary>
-		/// Compute the approximate reciprocal square root of packed single-precision (32-bit) floating-point elements in "a", and store the results in "dst". The maximum relative error for this approximation is less than 1.5*2^-12.
-		/// </summary>
-		/// <remarks><c>VRSQRTPS ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_rsqrt_ps(__m256 a) => System.Runtime.Intrinsics.X86.Avx.ReciprocalSqrt(a.FP32);
-
-		/// <summary>
-		/// Broadcast 16-bit integer "a" to all all elements of "dst". This intrinsic may generate the "vpbroadcastw".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>short {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_set1_epi16(short a) => System.Runtime.Intrinsics.Vector256.Create((ushort)a);
-
-		/// <summary>
-		/// Broadcast 32-bit integer "a" to all elements of "dst". This intrinsic may generate the "vpbroadcastd".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>int {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_set1_epi32(int a) => System.Runtime.Intrinsics.Vector256.Create((uint)a);
-
-		/// <summary>
-		/// Broadcast 64-bit integer "a" to all elements of "dst". This intrinsic may generate the "vpbroadcastq".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>long {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_set1_epi64x(long a) => System.Runtime.Intrinsics.Vector256.Create((ulong)a);
-
-		/// <summary>
-		/// Broadcast 8-bit integer "a" to all elements of "dst". This intrinsic may generate the "vpbroadcastb".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>byte {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_set1_epi8(byte a) => System.Runtime.Intrinsics.Vector256.Create(a);
-
-		/// <summary>
-		/// Broadcast double-precision (64-bit) floating-point value "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>double {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_set1_pd(double a) => System.Runtime.Intrinsics.Vector256.Create(a);
-
-		/// <summary>
-		/// Broadcast single-precision (32-bit) floating-point value "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>float {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_set1_ps(float a) => System.Runtime.Intrinsics.Vector256.Create(a);
-
-		/// <summary>
-		/// Set packed 16-bit integers in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e15"><c>short {UI16}</c></param>
-		/// <param name="e14"><c>short {UI16}</c></param>
-		/// <param name="e13"><c>short {UI16}</c></param>
-		/// <param name="e12"><c>short {UI16}</c></param>
-		/// <param name="e11"><c>short {UI16}</c></param>
-		/// <param name="e10"><c>short {UI16}</c></param>
-		/// <param name="e9"><c>short {UI16}</c></param>
-		/// <param name="e8"><c>short {UI16}</c></param>
-		/// <param name="e7"><c>short {UI16}</c></param>
-		/// <param name="e6"><c>short {UI16}</c></param>
-		/// <param name="e5"><c>short {UI16}</c></param>
-		/// <param name="e4"><c>short {UI16}</c></param>
-		/// <param name="e3"><c>short {UI16}</c></param>
-		/// <param name="e2"><c>short {UI16}</c></param>
-		/// <param name="e1"><c>short {UI16}</c></param>
-		/// <param name="e0"><c>short {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_setr_epi16(short e15, short e14, short e13, short e12, short e11, short e10, short e9, short e8, short e7, short e6, short e5, short e4, short e3, short e2, short e1, short e0) => System.Runtime.Intrinsics.Vector256.Create((ushort)e15, (ushort)e14, (ushort)e13, (ushort)e12, (ushort)e11, (ushort)e10, (ushort)e9, (ushort)e8, (ushort)e7, (ushort)e6, (ushort)e5, (ushort)e4, (ushort)e3, (ushort)e2, (ushort)e1, (ushort)e0);
-
-		/// <summary>
-		/// Set packed 32-bit integers in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e7"><c>int {UI32}</c></param>
-		/// <param name="e6"><c>int {UI32}</c></param>
-		/// <param name="e5"><c>int {UI32}</c></param>
-		/// <param name="e4"><c>int {UI32}</c></param>
-		/// <param name="e3"><c>int {UI32}</c></param>
-		/// <param name="e2"><c>int {UI32}</c></param>
-		/// <param name="e1"><c>int {UI32}</c></param>
-		/// <param name="e0"><c>int {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_setr_epi32(int e7, int e6, int e5, int e4, int e3, int e2, int e1, int e0) => System.Runtime.Intrinsics.Vector256.Create((uint)e7, (uint)e6, (uint)e5, (uint)e4, (uint)e3, (uint)e2, (uint)e1, (uint)e0);
-
-		/// <summary>
-		/// Set packed 64-bit integers in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e3"><c>long {UI64}</c></param>
-		/// <param name="e2"><c>long {UI64}</c></param>
-		/// <param name="e1"><c>long {UI64}</c></param>
-		/// <param name="e0"><c>long {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_setr_epi64x(long e3, long e2, long e1, long e0) => System.Runtime.Intrinsics.Vector256.Create((ulong)e3, (ulong)e2, (ulong)e1, (ulong)e0);
-
-		/// <summary>
-		/// Set packed 8-bit integers in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e31"><c>byte {UI8}</c></param>
-		/// <param name="e30"><c>byte {UI8}</c></param>
-		/// <param name="e29"><c>byte {UI8}</c></param>
-		/// <param name="e28"><c>byte {UI8}</c></param>
-		/// <param name="e27"><c>byte {UI8}</c></param>
-		/// <param name="e26"><c>byte {UI8}</c></param>
-		/// <param name="e25"><c>byte {UI8}</c></param>
-		/// <param name="e24"><c>byte {UI8}</c></param>
-		/// <param name="e23"><c>byte {UI8}</c></param>
-		/// <param name="e22"><c>byte {UI8}</c></param>
-		/// <param name="e21"><c>byte {UI8}</c></param>
-		/// <param name="e20"><c>byte {UI8}</c></param>
-		/// <param name="e19"><c>byte {UI8}</c></param>
-		/// <param name="e18"><c>byte {UI8}</c></param>
-		/// <param name="e17"><c>byte {UI8}</c></param>
-		/// <param name="e16"><c>byte {UI8}</c></param>
-		/// <param name="e15"><c>byte {UI8}</c></param>
-		/// <param name="e14"><c>byte {UI8}</c></param>
-		/// <param name="e13"><c>byte {UI8}</c></param>
-		/// <param name="e12"><c>byte {UI8}</c></param>
-		/// <param name="e11"><c>byte {UI8}</c></param>
-		/// <param name="e10"><c>byte {UI8}</c></param>
-		/// <param name="e9"><c>byte {UI8}</c></param>
-		/// <param name="e8"><c>byte {UI8}</c></param>
-		/// <param name="e7"><c>byte {UI8}</c></param>
-		/// <param name="e6"><c>byte {UI8}</c></param>
-		/// <param name="e5"><c>byte {UI8}</c></param>
-		/// <param name="e4"><c>byte {UI8}</c></param>
-		/// <param name="e3"><c>byte {UI8}</c></param>
-		/// <param name="e2"><c>byte {UI8}</c></param>
-		/// <param name="e1"><c>byte {UI8}</c></param>
-		/// <param name="e0"><c>byte {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_setr_epi8(byte e31, byte e30, byte e29, byte e28, byte e27, byte e26, byte e25, byte e24, byte e23, byte e22, byte e21, byte e20, byte e19, byte e18, byte e17, byte e16, byte e15, byte e14, byte e13, byte e12, byte e11, byte e10, byte e9, byte e8, byte e7, byte e6, byte e5, byte e4, byte e3, byte e2, byte e1, byte e0) => System.Runtime.Intrinsics.Vector256.Create(e31, e30, e29, e28, e27, e26, e25, e24, e23, e22, e21, e20, e19, e18, e17, e16, e15, e14, e13, e12, e11, e10, e9, e8, e7, e6, e5, e4, e3, e2, e1, e0);
-
-		/// <summary>
-		/// Set packed __m256 vector "dst" with the supplied values.
-		/// </summary>
-		/// <remarks><c>VINSERTF128 ymm, ymm, xmm, imm8</c></remarks>
-		/// <param name="lo"><c>__m128 {FP32}</c></param>
-		/// <param name="hi"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_setr_m128(__m128 lo, __m128 hi) => System.Runtime.Intrinsics.Vector256.Create(lo.FP32, hi.FP32);
-
-		/// <summary>
-		/// Set packed __m256d vector "dst" with the supplied values.
-		/// </summary>
-		/// <remarks><c>VINSERTF128 ymm, ymm, xmm, imm8</c></remarks>
-		/// <param name="lo"><c>__m128d {FP64}</c></param>
-		/// <param name="hi"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_setr_m128d(__m128d lo, __m128d hi) => System.Runtime.Intrinsics.Vector256.Create(lo.FP64, hi.FP64);
-
-		/// <summary>
-		/// Set packed __m256i vector "dst" with the supplied values.
-		/// </summary>
-		/// <remarks><c>VINSERTF128 ymm, ymm, xmm, imm8</c></remarks>
-		/// <param name="lo"><c>__m128i {M128}</c></param>
-		/// <param name="hi"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m256i dst {M128}</c></returns>
-		public static __m256i _mm256_setr_m128i(__m128i lo, __m128i hi) => System.Runtime.Intrinsics.Vector256.Create(lo.SI32, hi.SI32);
-
-		/// <summary>
-		/// Set packed double-precision (64-bit) floating-point elements in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e3"><c>double {FP64}</c></param>
-		/// <param name="e2"><c>double {FP64}</c></param>
-		/// <param name="e1"><c>double {FP64}</c></param>
-		/// <param name="e0"><c>double {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_setr_pd(double e3, double e2, double e1, double e0) => System.Runtime.Intrinsics.Vector256.Create(e3, e2, e1, e0);
-
-		/// <summary>
-		/// Set packed single-precision (32-bit) floating-point elements in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e7"><c>float {FP32}</c></param>
-		/// <param name="e6"><c>float {FP32}</c></param>
-		/// <param name="e5"><c>float {FP32}</c></param>
-		/// <param name="e4"><c>float {FP32}</c></param>
-		/// <param name="e3"><c>float {FP32}</c></param>
-		/// <param name="e2"><c>float {FP32}</c></param>
-		/// <param name="e1"><c>float {FP32}</c></param>
-		/// <param name="e0"><c>float {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_setr_ps(float e7, float e6, float e5, float e4, float e3, float e2, float e1, float e0) => System.Runtime.Intrinsics.Vector256.Create(e7, e6, e5, e4, e3, e2, e1, e0);
-
-		/// <summary>
-		/// Shuffle double-precision (64-bit) floating-point elements within 128-bit lanes using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VSHUFPD ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_shuffle_pd(__m256d a, __m256d b, int imm8) => System.Runtime.Intrinsics.X86.Avx.Shuffle(a.FP64, b.FP64, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle single-precision (32-bit) floating-point elements in "a" within 128-bit lanes using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VSHUFPS ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_shuffle_ps(__m256 a, __m256 b, int imm8) => System.Runtime.Intrinsics.X86.Avx.Shuffle(a.FP32, b.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Compute the square root of packed double-precision (64-bit) floating-point elements in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VSQRTPD ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_sqrt_pd(__m256d a) => System.Runtime.Intrinsics.X86.Avx.Sqrt(a.FP64);
-
-		/// <summary>
-		/// Compute the square root of packed single-precision (32-bit) floating-point elements in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VSQRTPS ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_sqrt_ps(__m256 a) => System.Runtime.Intrinsics.X86.Avx.Sqrt(a.FP32);
-
-		/// <summary>
-		/// Store 256-bits (composed of 4 packed double-precision (64-bit) floating-point elements) from "a" into memory.	"mem_addr" must be aligned on a 32-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>VMOVAPD m256, ymm</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_store_pd(double* mem_addr, __m256d a) => System.Runtime.Intrinsics.X86.Avx.StoreAligned(mem_addr, a.FP64);
-
-		/// <summary>
-		/// Store 256-bits (composed of 8 packed single-precision (32-bit) floating-point elements) from "a" into memory.	"mem_addr" must be aligned on a 32-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>VMOVAPS m256, ymm</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_store_ps(float* mem_addr, __m256 a) => System.Runtime.Intrinsics.X86.Avx.StoreAligned(mem_addr, a.FP32);
-
-		/// <summary>
-		/// Store 256-bits of integer data from "a" into memory.	"mem_addr" must be aligned on a 32-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>VMOVDQA m256, ymm</c></remarks>
-		/// <param name="mem_addr"><c>__m256i {M256}</c></param>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_store_si256(__m256i* mem_addr, __m256i a) => System.Runtime.Intrinsics.X86.Avx.StoreAligned((sbyte*)mem_addr, a.SI8);
-
-		/// <summary>
-		/// Store 256-bits (composed of 4 packed double-precision (64-bit) floating-point elements) from "a" into memory.	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>VMOVUPD m256, ymm</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_storeu_pd(double* mem_addr, __m256d a) => System.Runtime.Intrinsics.X86.Avx.Store(mem_addr, a.FP64);
-
-		/// <summary>
-		/// Store 256-bits (composed of 8 packed single-precision (32-bit) floating-point elements) from "a" into memory.	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>VMOVUPS m256, ymm</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_storeu_ps(float* mem_addr, __m256 a) => System.Runtime.Intrinsics.X86.Avx.Store(mem_addr, a.FP32);
-
-		/// <summary>
-		/// Store 256-bits of integer data from "a" into memory.	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>VMOVDQU m256, ymm</c></remarks>
-		/// <param name="mem_addr"><c>__m256i {M256}</c></param>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_storeu_si256(__m256i* mem_addr, __m256i a) => System.Runtime.Intrinsics.X86.Avx.Store((sbyte*)mem_addr, a.SI8);
-
-		/// <summary>
-		/// Store 256-bits (composed of 4 packed double-precision (64-bit) floating-point elements) from "a" into memory using a non-temporal memory hint.	"mem_addr" must be aligned on a 32-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>VMOVNTPD m256, ymm</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_stream_pd(double* mem_addr, __m256d a) => System.Runtime.Intrinsics.X86.Avx.StoreAlignedNonTemporal(mem_addr, a.FP64);
-
-		/// <summary>
-		/// Store 256-bits (composed of 8 packed single-precision (32-bit) floating-point elements) from "a" into memory using a non-temporal memory hint.	"mem_addr" must be aligned on a 32-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>VMOVNTPS m256, ymm</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_stream_ps(float* mem_addr, __m256 a) => System.Runtime.Intrinsics.X86.Avx.StoreAlignedNonTemporal(mem_addr, a.FP32);
-
-		/// <summary>
-		/// Store 256-bits of integer data from "a" into memory using a non-temporal memory hint.	"mem_addr" must be aligned on a 32-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>VMOVNTDQ m256, ymm</c></remarks>
-		/// <param name="mem_addr"><c>__m256i {M256}</c></param>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_stream_si256(__m256i* mem_addr, __m256i a) => System.Runtime.Intrinsics.X86.Avx.StoreAlignedNonTemporal((sbyte*)mem_addr, a.SI8);
-
-		/// <summary>
-		/// Subtract packed double-precision (64-bit) floating-point elements in "b" from packed double-precision (64-bit) floating-point elements in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VSUBPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_sub_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.Subtract(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Subtract packed single-precision (32-bit) floating-point elements in "b" from packed single-precision (32-bit) floating-point elements in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VSUBPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_sub_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.Subtract(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise AND of 256 bits (representing double-precision (64-bit) floating-point elements) in "a" and "b", producing an intermediate 256-bit value, and set "ZF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return the "CF" value.
-		/// </summary>
-		/// <remarks><c>VTESTPD ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm256_testc_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.TestC(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise AND of 256 bits (representing single-precision (32-bit) floating-point elements) in "a" and "b", producing an intermediate 256-bit value, and set "ZF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return the "CF" value.
-		/// </summary>
-		/// <remarks><c>VTESTPS ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm256_testc_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.TestC(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise AND of 256 bits (representing integer data) in "a" and "b", and set "ZF" to 1 if the result is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", and set "CF" to 1 if the result is zero, otherwise set "CF" to 0. Return the "CF" value.
-		/// </summary>
-		/// <remarks><c>VPTEST ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <param name="b"><c>__m256i {M256}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm256_testc_si256(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx.TestC(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Compute the bitwise AND of 256 bits (representing double-precision (64-bit) floating-point elements) in "a" and "b", producing an intermediate 256-bit value, and set "ZF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return 1 if both the "ZF" and "CF" values are zero, otherwise return 0.
-		/// </summary>
-		/// <remarks><c>VTESTPD ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm256_testnzc_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.TestNotZAndNotC(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise AND of 256 bits (representing single-precision (32-bit) floating-point elements) in "a" and "b", producing an intermediate 256-bit value, and set "ZF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return 1 if both the "ZF" and "CF" values are zero, otherwise return 0.
-		/// </summary>
-		/// <remarks><c>VTESTPS ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm256_testnzc_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.TestNotZAndNotC(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise AND of 256 bits (representing integer data) in "a" and "b", and set "ZF" to 1 if the result is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", and set "CF" to 1 if the result is zero, otherwise set "CF" to 0. Return 1 if both the "ZF" and "CF" values are zero, otherwise return 0.
-		/// </summary>
-		/// <remarks><c>VPTEST ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <param name="b"><c>__m256i {M256}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm256_testnzc_si256(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx.TestNotZAndNotC(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Compute the bitwise AND of 256 bits (representing double-precision (64-bit) floating-point elements) in "a" and "b", producing an intermediate 256-bit value, and set "ZF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 64-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return the "ZF" value.
-		/// </summary>
-		/// <remarks><c>VTESTPD ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm256_testz_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.TestZ(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise AND of 256 bits (representing single-precision (32-bit) floating-point elements) in "a" and "b", producing an intermediate 256-bit value, and set "ZF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", producing an intermediate value, and set "CF" to 1 if the sign bit of each 32-bit element in the intermediate value is zero, otherwise set "CF" to 0. Return the "ZF" value.
-		/// </summary>
-		/// <remarks><c>VTESTPS ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm256_testz_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.TestZ(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise AND of 256 bits (representing integer data) in "a" and "b", and set "ZF" to 1 if the result is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", and set "CF" to 1 if the result is zero, otherwise set "CF" to 0. Return the "ZF" value.
-		/// </summary>
-		/// <remarks><c>VPTEST ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <param name="b"><c>__m256i {M256}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm256_testz_si256(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx.TestZ(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Unpack and interleave double-precision (64-bit) floating-point elements from the high half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VUNPCKHPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_unpackhi_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.UnpackHigh(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Unpack and interleave single-precision (32-bit) floating-point elements from the high half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VUNPCKHPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_unpackhi_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.UnpackHigh(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Unpack and interleave double-precision (64-bit) floating-point elements from the low half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VUNPCKLPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_unpacklo_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.UnpackLow(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Unpack and interleave single-precision (32-bit) floating-point elements from the low half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VUNPCKLPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_unpacklo_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.UnpackLow(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise XOR of packed double-precision (64-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VXORPD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_xor_pd(__m256d a, __m256d b) => System.Runtime.Intrinsics.X86.Avx.Xor(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise XOR of packed single-precision (32-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VXORPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_xor_ps(__m256 a, __m256 b) => System.Runtime.Intrinsics.X86.Avx.Xor(a.FP32, b.FP32);
-
-	}
-}
diff --git a/src/External/RawIntrinsics/AVX2.cs b/src/External/RawIntrinsics/AVX2.cs
deleted file mode 100644
index 931839c..0000000
--- a/src/External/RawIntrinsics/AVX2.cs
+++ /dev/null
@@ -1,1726 +0,0 @@
-namespace RawIntrinsics
-{
-	public static unsafe partial class AVX2
-	{
-		/// <summary>
-		/// Blend packed 32-bit integers from "a" and "b" using control mask "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPBLENDD xmm, xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="b"><c>__m128i {UI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_blend_epi32(__m128i a, __m128i b, int imm8) => System.Runtime.Intrinsics.X86.Avx2.Blend(a.UI32, b.UI32, (byte)imm8);
-
-		/// <summary>
-		/// Broadcast the low packed 8-bit integer from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VPBROADCASTB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_broadcastb_epi8(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector128(a.UI8);
-
-		/// <summary>
-		/// Broadcast the low packed 32-bit integer from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VPBROADCASTD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_broadcastd_epi32(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector128(a.UI32);
-
-		/// <summary>
-		/// Broadcast the low packed 64-bit integer from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VPBROADCASTQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_broadcastq_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector128(a.UI64);
-
-		/// <summary>
-		/// Broadcast the low double-precision (64-bit) floating-point element from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>MOVDDUP xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_broadcastsd_pd(__m128d a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector128(a.FP64);
-
-		/// <summary>
-		/// Broadcast the low single-precision (32-bit) floating-point element from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VBROADCASTSS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_broadcastss_ps(__m128 a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector128(a.FP32);
-
-		/// <summary>
-		/// Broadcast the low packed 16-bit integer from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VPBROADCASTW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_broadcastw_epi16(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector128(a.UI16);
-
-		/// <summary>
-		/// Gather 32-bit integers from memory using 32-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERDD xmm, vm32x, xmm</c></remarks>
-		/// <param name="base_addr"><c>int {UI32}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_i32gather_epi32(int* base_addr, __m128i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector128((uint*)base_addr, vindex.SI32, (byte)scale);
-
-		/// <summary>
-		/// Gather 64-bit integers from memory using 32-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERDQ xmm, vm32x, xmm</c></remarks>
-		/// <param name="base_addr"><c>long {UI64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_i32gather_epi64(long* base_addr, __m128i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector128((ulong*)base_addr, vindex.SI32, (byte)scale);
-
-		/// <summary>
-		/// Gather double-precision (64-bit) floating-point elements from memory using 32-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERDPD xmm, vm32x, xmm</c></remarks>
-		/// <param name="base_addr"><c>double {FP64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_i32gather_pd(double* base_addr, __m128i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector128(base_addr, vindex.SI32, (byte)scale);
-
-		/// <summary>
-		/// Gather single-precision (32-bit) floating-point elements from memory using 32-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERDPS xmm, vm32x, xmm</c></remarks>
-		/// <param name="base_addr"><c>float {FP32}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_i32gather_ps(float* base_addr, __m128i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector128(base_addr, vindex.SI32, (byte)scale);
-
-		/// <summary>
-		/// Gather 32-bit integers from memory using 64-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERQD xmm, vm64x, xmm</c></remarks>
-		/// <param name="base_addr"><c>int {UI32}</c></param>
-		/// <param name="vindex"><c>__m128i {SI64}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_i64gather_epi32(int* base_addr, __m128i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector128((uint*)base_addr, vindex.SI64, (byte)scale);
-
-		/// <summary>
-		/// Gather 64-bit integers from memory using 64-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERQQ xmm, vm64x, xmm</c></remarks>
-		/// <param name="base_addr"><c>long {UI64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI64}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_i64gather_epi64(long* base_addr, __m128i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector128((ulong*)base_addr, vindex.SI64, (byte)scale);
-
-		/// <summary>
-		/// Gather double-precision (64-bit) floating-point elements from memory using 64-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERQPD xmm, vm64x, xmm</c></remarks>
-		/// <param name="base_addr"><c>double {FP64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI64}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_i64gather_pd(double* base_addr, __m128i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector128(base_addr, vindex.SI64, (byte)scale);
-
-		/// <summary>
-		/// Gather single-precision (32-bit) floating-point elements from memory using 64-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERQPS xmm, vm64x, xmm</c></remarks>
-		/// <param name="base_addr"><c>float {FP32}</c></param>
-		/// <param name="vindex"><c>__m128i {SI64}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_i64gather_ps(float* base_addr, __m128i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector128(base_addr, vindex.SI64, (byte)scale);
-
-		/// <summary>
-		/// Gather 32-bit integers from memory using 32-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERDD xmm, vm32x, xmm</c></remarks>
-		/// <param name="src"><c>__m128i {UI32}</c></param>
-		/// <param name="base_addr"><c>int {UI32}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_mask_i32gather_epi32(__m128i src, int* base_addr, __m128i vindex, __m128i mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector128(src.UI32, (uint*)base_addr, vindex.SI32, mask.UI32, (byte)scale);
-
-		/// <summary>
-		/// Gather 64-bit integers from memory using 32-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERDQ xmm, vm32x, xmm</c></remarks>
-		/// <param name="src"><c>__m128i {UI64}</c></param>
-		/// <param name="base_addr"><c>long {UI64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_mask_i32gather_epi64(__m128i src, long* base_addr, __m128i vindex, __m128i mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector128(src.UI64, (ulong*)base_addr, vindex.SI32, mask.UI64, (byte)scale);
-
-		/// <summary>
-		/// Gather double-precision (64-bit) floating-point elements from memory using 32-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERDPD xmm, vm32x, xmm</c></remarks>
-		/// <param name="src"><c>__m128d {FP64}</c></param>
-		/// <param name="base_addr"><c>double {FP64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="mask"><c>__m128d {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_mask_i32gather_pd(__m128d src, double* base_addr, __m128i vindex, __m128d mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector128(src.FP64, base_addr, vindex.SI32, mask.FP64, (byte)scale);
-
-		/// <summary>
-		/// Gather single-precision (32-bit) floating-point elements from memory using 32-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERDPS xmm, vm32x, xmm</c></remarks>
-		/// <param name="src"><c>__m128 {FP32}</c></param>
-		/// <param name="base_addr"><c>float {FP32}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="mask"><c>__m128 {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_mask_i32gather_ps(__m128 src, float* base_addr, __m128i vindex, __m128 mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector128(src.FP32, base_addr, vindex.SI32, mask.FP32, (byte)scale);
-
-		/// <summary>
-		/// Gather 32-bit integers from memory using 64-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERQD xmm, vm64x, xmm</c></remarks>
-		/// <param name="src"><c>__m128i {UI32}</c></param>
-		/// <param name="base_addr"><c>int {UI32}</c></param>
-		/// <param name="vindex"><c>__m128i {SI64}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_mask_i64gather_epi32(__m128i src, int* base_addr, __m128i vindex, __m128i mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector128(src.UI32, (uint*)base_addr, vindex.SI64, mask.UI32, (byte)scale);
-
-		/// <summary>
-		/// Gather 64-bit integers from memory using 64-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERQQ xmm, vm64x, xmm</c></remarks>
-		/// <param name="src"><c>__m128i {UI64}</c></param>
-		/// <param name="base_addr"><c>long {UI64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI64}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_mask_i64gather_epi64(__m128i src, long* base_addr, __m128i vindex, __m128i mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector128(src.UI64, (ulong*)base_addr, vindex.SI64, mask.UI64, (byte)scale);
-
-		/// <summary>
-		/// Gather double-precision (64-bit) floating-point elements from memory using 64-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERQPD xmm, vm64x, xmm</c></remarks>
-		/// <param name="src"><c>__m128d {FP64}</c></param>
-		/// <param name="base_addr"><c>double {FP64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI64}</c></param>
-		/// <param name="mask"><c>__m128d {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_mask_i64gather_pd(__m128d src, double* base_addr, __m128i vindex, __m128d mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector128(src.FP64, base_addr, vindex.SI64, mask.FP64, (byte)scale);
-
-		/// <summary>
-		/// Gather single-precision (32-bit) floating-point elements from memory using 64-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERQPS xmm, vm64x, xmm</c></remarks>
-		/// <param name="src"><c>__m128 {FP32}</c></param>
-		/// <param name="base_addr"><c>float {FP32}</c></param>
-		/// <param name="vindex"><c>__m128i {SI64}</c></param>
-		/// <param name="mask"><c>__m128 {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_mask_i64gather_ps(__m128 src, float* base_addr, __m128i vindex, __m128 mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector128(src.FP32, base_addr, vindex.SI64, mask.FP32, (byte)scale);
-
-		/// <summary>
-		/// Load packed 32-bit integers from memory into "dst" using "mask" (elements are zeroed out when the highest bit is not set in the corresponding element).
-		/// </summary>
-		/// <remarks><c>VPMASKMOVD xmm, xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>int {UI32}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_maskload_epi32(int* mem_addr, __m128i mask) => System.Runtime.Intrinsics.X86.Avx2.MaskLoad((uint*)mem_addr, mask.UI32);
-
-		/// <summary>
-		/// Load packed 64-bit integers from memory into "dst" using "mask" (elements are zeroed out when the highest bit is not set in the corresponding element).
-		/// </summary>
-		/// <remarks><c>VPMASKMOVQ xmm, xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>long {UI64}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_maskload_epi64(long* mem_addr, __m128i mask) => System.Runtime.Intrinsics.X86.Avx2.MaskLoad((ulong*)mem_addr, mask.UI64);
-
-		/// <summary>
-		/// Store packed 32-bit integers from "a" into memory using "mask" (elements are not stored when the highest bit is not set in the corresponding element).
-		/// </summary>
-		/// <remarks><c>VPMASKMOVD m128, xmm, xmm</c></remarks>
-		/// <param name="mem_addr"><c>int {UI32}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_maskstore_epi32(int* mem_addr, __m128i mask, __m128i a) => System.Runtime.Intrinsics.X86.Avx2.MaskStore((uint*)mem_addr, mask.UI32, a.UI32);
-
-		/// <summary>
-		/// Store packed 64-bit integers from "a" into memory using "mask" (elements are not stored when the highest bit is not set in the corresponding element).
-		/// </summary>
-		/// <remarks><c>VPMASKMOVQ m128, xmm, xmm</c></remarks>
-		/// <param name="mem_addr"><c>long {UI64}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_maskstore_epi64(long* mem_addr, __m128i mask, __m128i a) => System.Runtime.Intrinsics.X86.Avx2.MaskStore((ulong*)mem_addr, mask.UI64, a.UI64);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" left by the amount specified by the corresponding element in "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSLLVD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="count"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_sllv_epi32(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftLeftLogicalVariable(a.UI32, count.UI32);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" left by the amount specified by the corresponding element in "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSLLVQ xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="count"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_sllv_epi64(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftLeftLogicalVariable(a.UI64, count.UI64);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" right by the amount specified by the corresponding element in "count" while shifting in sign bits, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRAVD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="count"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_srav_epi32(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightArithmeticVariable(a.SI32, count.UI32);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" right by the amount specified by the corresponding element in "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRLVD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="count"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_srlv_epi32(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightLogicalVariable(a.UI32, count.UI32);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" right by the amount specified by the corresponding element in "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRLVQ xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="count"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_srlv_epi64(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightLogicalVariable(a.UI64, count.UI64);
-
-		/// <summary>
-		/// Compute the absolute value of packed signed 16-bit integers in "a", and store the unsigned results in "dst".
-		/// </summary>
-		/// <remarks><c>VPABSW ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_abs_epi16(__m256i a) => System.Runtime.Intrinsics.X86.Avx2.Abs(a.SI16);
-
-		/// <summary>
-		/// Compute the absolute value of packed signed 32-bit integers in "a", and store the unsigned results in "dst".
-		/// </summary>
-		/// <remarks><c>VPABSD ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_abs_epi32(__m256i a) => System.Runtime.Intrinsics.X86.Avx2.Abs(a.SI32);
-
-		/// <summary>
-		/// Compute the absolute value of packed signed 8-bit integers in "a", and store the unsigned results in "dst".
-		/// </summary>
-		/// <remarks><c>VPABSB ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_abs_epi8(__m256i a) => System.Runtime.Intrinsics.X86.Avx2.Abs(a.SI8);
-
-		/// <summary>
-		/// Add packed 16-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPADDW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_add_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Add(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Add packed 32-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPADDD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_add_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Add(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Add packed 64-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPADDQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="b"><c>__m256i {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_add_epi64(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Add(a.UI64, b.UI64);
-
-		/// <summary>
-		/// Add packed 8-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPADDB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_add_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Add(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Add packed 16-bit integers in "a" and "b" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPADDSW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_adds_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.AddSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Add packed 8-bit integers in "a" and "b" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPADDSB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI8}</c></param>
-		/// <param name="b"><c>__m256i {SI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_adds_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.AddSaturate(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Add packed unsigned 16-bit integers in "a" and "b" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPADDUSW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_adds_epu16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.AddSaturate(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Add packed unsigned 8-bit integers in "a" and "b" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPADDUSB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_adds_epu8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.AddSaturate(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Concatenate pairs of 16-byte blocks in "a" and "b" into a 32-byte temporary result, shift the result right by "imm8" bytes, and store the low 16 bytes in "dst".
-		/// </summary>
-		/// <remarks><c>VPALIGNR ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_alignr_epi8(__m256i a, __m256i b, int imm8) => System.Runtime.Intrinsics.X86.Avx2.AlignRight(a.UI8, b.UI8, (byte)imm8);
-
-		/// <summary>
-		/// Compute the bitwise AND of 256 bits (representing integer data) in "a" and "b", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>VPAND ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <param name="b"><c>__m256i {M256}</c></param>
-		/// <returns><c>__m256i dst {M256}</c></returns>
-		public static __m256i _mm256_and_si256(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.And(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Compute the bitwise NOT of 256 bits (representing integer data) in "a" and then AND with "b", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>VPANDN ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <param name="b"><c>__m256i {M256}</c></param>
-		/// <returns><c>__m256i dst {M256}</c></returns>
-		public static __m256i _mm256_andnot_si256(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.AndNot(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Average packed unsigned 16-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPAVGW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_avg_epu16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Average(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Average packed unsigned 8-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPAVGB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_avg_epu8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Average(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Blend packed 16-bit integers from "a" and "b" within 128-bit lanes using control mask "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPBLENDW ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_blend_epi16(__m256i a, __m256i b, int imm8) => System.Runtime.Intrinsics.X86.Avx2.Blend(a.UI16, b.UI16, (byte)imm8);
-
-		/// <summary>
-		/// Blend packed 32-bit integers from "a" and "b" using control mask "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPBLENDD ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_blend_epi32(__m256i a, __m256i b, int imm8) => System.Runtime.Intrinsics.X86.Avx2.Blend(a.UI32, b.UI32, (byte)imm8);
-
-		/// <summary>
-		/// Blend packed 8-bit integers from "a" and "b" using "mask", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPBLENDVB ymm, ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_blendv_epi8(__m256i a, __m256i b, __m256i mask) => System.Runtime.Intrinsics.X86.Avx2.BlendVariable(a.UI8, b.UI8, mask.UI8);
-
-		/// <summary>
-		/// Broadcast the low packed 8-bit integer from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VPBROADCASTB ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_broadcastb_epi8(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector256(a.UI8);
-
-		/// <summary>
-		/// Broadcast the low packed 32-bit integer from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VPBROADCASTD ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_broadcastd_epi32(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector256(a.UI32);
-
-		/// <summary>
-		/// Broadcast the low packed 64-bit integer from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VPBROADCASTQ ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_broadcastq_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector256(a.UI64);
-
-		/// <summary>
-		/// Broadcast the low double-precision (64-bit) floating-point element from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VBROADCASTSD ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_broadcastsd_pd(__m128d a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector256(a.FP64);
-
-		/// <summary>
-		/// Broadcast 128 bits of integer data from "a" to all 128-bit lanes in "dst".
-		/// </summary>
-		/// <remarks><c>VBROADCASTI128 ymm, m128</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m256i dst {M128}</c></returns>
-		public static __m256i _mm256_broadcastsi128_si256(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastVector128ToVector256((sbyte*)&a);
-
-		/// <summary>
-		/// Broadcast the low single-precision (32-bit) floating-point element from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VBROADCASTSS ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_broadcastss_ps(__m128 a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector256(a.FP32);
-
-		/// <summary>
-		/// Broadcast the low packed 16-bit integer from "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c>VPBROADCASTW ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_broadcastw_epi16(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.BroadcastScalarToVector256(a.UI16);
-
-		/// <summary>
-		/// Shift 128-bit lanes in "a" left by "imm8" bytes while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSLLDQ ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {M128}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {M128}</c></returns>
-		public static __m256i _mm256_bslli_epi128(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShiftLeftLogical128BitLane(a.SI8, (byte)imm8);
-
-		/// <summary>
-		/// Shift 128-bit lanes in "a" right by "imm8" bytes while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRLDQ ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {M128}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {M128}</c></returns>
-		public static __m256i _mm256_bsrli_epi128(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightLogical128BitLane(a.SI8, (byte)imm8);
-
-		/// <summary>
-		/// Compare packed 16-bit integers in "a" and "b" for equality, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPCMPEQW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_cmpeq_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.CompareEqual(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Compare packed 32-bit integers in "a" and "b" for equality, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPCMPEQD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_cmpeq_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.CompareEqual(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Compare packed 64-bit integers in "a" and "b" for equality, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPCMPEQQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="b"><c>__m256i {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_cmpeq_epi64(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.CompareEqual(a.UI64, b.UI64);
-
-		/// <summary>
-		/// Compare packed 8-bit integers in "a" and "b" for equality, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPCMPEQB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_cmpeq_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.CompareEqual(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Compare packed signed 16-bit integers in "a" and "b" for greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPCMPGTW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_cmpgt_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.CompareGreaterThan(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Compare packed signed 32-bit integers in "a" and "b" for greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPCMPGTD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <param name="b"><c>__m256i {SI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_cmpgt_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.CompareGreaterThan(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Compare packed signed 64-bit integers in "a" and "b" for greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPCMPGTQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI64}</c></param>
-		/// <param name="b"><c>__m256i {SI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_cmpgt_epi64(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.CompareGreaterThan(a.SI64, b.SI64);
-
-		/// <summary>
-		/// Compare packed signed 8-bit integers in "a" and "b" for greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPCMPGTB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI8}</c></param>
-		/// <param name="b"><c>__m256i {SI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_cmpgt_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.CompareGreaterThan(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Sign extend packed 16-bit integers in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVSXWD ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m256i dst {SI32}</c></returns>
-		public static __m256i _mm256_cvtepi16_epi32(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int32(a.SI16);
-
-		/// <summary>
-		/// Sign extend packed 16-bit integers in "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVSXWQ ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m256i dst {SI64}</c></returns>
-		public static __m256i _mm256_cvtepi16_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int64(a.SI16);
-
-		/// <summary>
-		/// Sign extend packed 32-bit integers in "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVSXDQ ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m256i dst {SI64}</c></returns>
-		public static __m256i _mm256_cvtepi32_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int64(a.SI32);
-
-		/// <summary>
-		/// Sign extend packed 8-bit integers in "a" to packed 16-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVSXBW ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m256i dst {SI16}</c></returns>
-		public static __m256i _mm256_cvtepi8_epi16(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int16(a.SI8);
-
-		/// <summary>
-		/// Sign extend packed 8-bit integers in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVSXBD ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m256i dst {SI32}</c></returns>
-		public static __m256i _mm256_cvtepi8_epi32(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int32(a.SI8);
-
-		/// <summary>
-		/// Sign extend packed 8-bit integers in the low 8 bytes of "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVSXBQ ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m256i dst {SI64}</c></returns>
-		public static __m256i _mm256_cvtepi8_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int64(a.SI8);
-
-		/// <summary>
-		/// Zero extend packed unsigned 16-bit integers in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVZXWD ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_cvtepu16_epi32(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int32(a.UI16);
-
-		/// <summary>
-		/// Zero extend packed unsigned 16-bit integers in "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVZXWQ ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_cvtepu16_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int64(a.UI16);
-
-		/// <summary>
-		/// Zero extend packed unsigned 32-bit integers in "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVZXDQ ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_cvtepu32_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int64(a.UI32);
-
-		/// <summary>
-		/// Zero extend packed unsigned 8-bit integers in "a" to packed 16-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVZXBW ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_cvtepu8_epi16(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int16(a.UI8);
-
-		/// <summary>
-		/// Zero extend packed unsigned 8-bit integers in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVZXBD ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_cvtepu8_epi32(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int32(a.UI8);
-
-		/// <summary>
-		/// Zero extend packed unsigned 8-bit integers in the low 8 byte sof "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVZXBQ ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_cvtepu8_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Avx2.ConvertToVector256Int64(a.UI8);
-
-		/// <summary>
-		/// Extract 128 bits (composed of integer data) from "a", selected with "imm8", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>VEXTRACTI128 xmm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {M128}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm256_extracti128_si256(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ExtractVector128(a.SI8, (byte)imm8);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of 16-bit integers in "a" and "b", and pack the signed 16-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>VPHADDW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_hadd_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.HorizontalAdd(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of 32-bit integers in "a" and "b", and pack the signed 32-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>VPHADDD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_hadd_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.HorizontalAdd(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of signed 16-bit integers in "a" and "b" using saturation, and pack the signed 16-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>VPHADDSW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_hadds_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.HorizontalAddSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Horizontally subtract adjacent pairs of 16-bit integers in "a" and "b", and pack the signed 16-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>VPHSUBW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_hsub_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.HorizontalSubtract(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Horizontally subtract adjacent pairs of 32-bit integers in "a" and "b", and pack the signed 32-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>VPHSUBD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_hsub_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.HorizontalSubtract(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Horizontally subtract adjacent pairs of signed 16-bit integers in "a" and "b" using saturation, and pack the signed 16-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>VPHSUBSW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_hsubs_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.HorizontalSubtractSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Gather 32-bit integers from memory using 32-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERDD ymm, vm32x, ymm</c></remarks>
-		/// <param name="base_addr"><c>int {UI32}</c></param>
-		/// <param name="vindex"><c>__m256i {SI32}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_i32gather_epi32(int* base_addr, __m256i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector256((uint*)base_addr, vindex.SI32, (byte)scale);
-
-		/// <summary>
-		/// Gather 64-bit integers from memory using 32-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERDQ ymm, vm32x, ymm</c></remarks>
-		/// <param name="base_addr"><c>long {UI64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_i32gather_epi64(long* base_addr, __m128i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector256((ulong*)base_addr, vindex.SI32, (byte)scale);
-
-		/// <summary>
-		/// Gather double-precision (64-bit) floating-point elements from memory using 32-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERDPD ymm, vm32x, ymm</c></remarks>
-		/// <param name="base_addr"><c>double {FP64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_i32gather_pd(double* base_addr, __m128i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector256(base_addr, vindex.SI32, (byte)scale);
-
-		/// <summary>
-		/// Gather single-precision (32-bit) floating-point elements from memory using 32-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERDPS ymm, vm32x, ymm</c></remarks>
-		/// <param name="base_addr"><c>float {FP32}</c></param>
-		/// <param name="vindex"><c>__m256i {SI32}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_i32gather_ps(float* base_addr, __m256i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector256(base_addr, vindex.SI32, (byte)scale);
-
-		/// <summary>
-		/// Gather 32-bit integers from memory using 64-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERQD xmm, vm64y, xmm</c></remarks>
-		/// <param name="base_addr"><c>int {UI32}</c></param>
-		/// <param name="vindex"><c>__m256i {SI64}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm256_i64gather_epi32(int* base_addr, __m256i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector128((uint*)base_addr, vindex.SI64, (byte)scale);
-
-		/// <summary>
-		/// Gather 64-bit integers from memory using 64-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERQQ ymm, vm64x, ymm</c></remarks>
-		/// <param name="base_addr"><c>long {UI64}</c></param>
-		/// <param name="vindex"><c>__m256i {SI64}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_i64gather_epi64(long* base_addr, __m256i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector256((ulong*)base_addr, vindex.SI64, (byte)scale);
-
-		/// <summary>
-		/// Gather double-precision (64-bit) floating-point elements from memory using 64-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERQPD ymm, vm64x, ymm</c></remarks>
-		/// <param name="base_addr"><c>double {FP64}</c></param>
-		/// <param name="vindex"><c>__m256i {SI64}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_i64gather_pd(double* base_addr, __m256i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector256(base_addr, vindex.SI64, (byte)scale);
-
-		/// <summary>
-		/// Gather single-precision (32-bit) floating-point elements from memory using 64-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst". "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERQPS xmm, vm64y, xmm</c></remarks>
-		/// <param name="base_addr"><c>float {FP32}</c></param>
-		/// <param name="vindex"><c>__m256i {SI64}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm256_i64gather_ps(float* base_addr, __m256i vindex, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherVector128(base_addr, vindex.SI64, (byte)scale);
-
-		/// <summary>
-		/// Copy "a" to "dst", then insert 128 bits (composed of integer data) from "b" into "dst" at the location specified by "imm8".
-		/// </summary>
-		/// <remarks><c>VINSERTI128 ymm, ymm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <param name="b"><c>__m128i {M128}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {M128}</c></returns>
-		public static __m256i _mm256_inserti128_si256(__m256i a, __m128i b, int imm8) => System.Runtime.Intrinsics.X86.Avx2.InsertVector128(a.SI8, b.SI8, (byte)imm8);
-
-		/// <summary>
-		/// Multiply packed signed 16-bit integers in "a" and "b", producing intermediate signed 32-bit integers. Horizontally add adjacent pairs of intermediate 32-bit integers, and pack the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMADDWD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {SI32}</c></returns>
-		public static __m256i _mm256_madd_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.MultiplyAddAdjacent(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Vertically multiply each unsigned 8-bit integer from "a" with the corresponding signed 8-bit integer from "b", producing intermediate signed 16-bit integers. Horizontally add adjacent pairs of intermediate signed 16-bit integers, and pack the saturated results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMADDUBSW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {SI8}</c></param>
-		/// <returns><c>__m256i dst {SI16}</c></returns>
-		public static __m256i _mm256_maddubs_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.MultiplyAddAdjacent(a.UI8, b.SI8);
-
-		/// <summary>
-		/// Gather 32-bit integers from memory using 32-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERDD ymm, vm32x, ymm</c></remarks>
-		/// <param name="src"><c>__m256i {UI32}</c></param>
-		/// <param name="base_addr"><c>int {UI32}</c></param>
-		/// <param name="vindex"><c>__m256i {SI32}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_mask_i32gather_epi32(__m256i src, int* base_addr, __m256i vindex, __m256i mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector256(src.UI32, (uint*)base_addr, vindex.SI32, mask.UI32, (byte)scale);
-
-		/// <summary>
-		/// Gather 64-bit integers from memory using 32-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERDQ ymm, vm32x, ymm</c></remarks>
-		/// <param name="src"><c>__m256i {UI64}</c></param>
-		/// <param name="base_addr"><c>long {UI64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_mask_i32gather_epi64(__m256i src, long* base_addr, __m128i vindex, __m256i mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector256(src.UI64, (ulong*)base_addr, vindex.SI32, mask.UI64, (byte)scale);
-
-		/// <summary>
-		/// Gather double-precision (64-bit) floating-point elements from memory using 32-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERDPD ymm, vm32x, ymm</c></remarks>
-		/// <param name="src"><c>__m256d {FP64}</c></param>
-		/// <param name="base_addr"><c>double {FP64}</c></param>
-		/// <param name="vindex"><c>__m128i {SI32}</c></param>
-		/// <param name="mask"><c>__m256d {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_mask_i32gather_pd(__m256d src, double* base_addr, __m128i vindex, __m256d mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector256(src.FP64, base_addr, vindex.SI32, mask.FP64, (byte)scale);
-
-		/// <summary>
-		/// Gather single-precision (32-bit) floating-point elements from memory using 32-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 32-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERDPS ymm, vm32x, ymm</c></remarks>
-		/// <param name="src"><c>__m256 {FP32}</c></param>
-		/// <param name="base_addr"><c>float {FP32}</c></param>
-		/// <param name="vindex"><c>__m256i {SI32}</c></param>
-		/// <param name="mask"><c>__m256 {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_mask_i32gather_ps(__m256 src, float* base_addr, __m256i vindex, __m256 mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector256(src.FP32, base_addr, vindex.SI32, mask.FP32, (byte)scale);
-
-		/// <summary>
-		/// Gather 32-bit integers from memory using 64-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERQD xmm, vm64y, xmm</c></remarks>
-		/// <param name="src"><c>__m128i {UI32}</c></param>
-		/// <param name="base_addr"><c>int {UI32}</c></param>
-		/// <param name="vindex"><c>__m256i {SI64}</c></param>
-		/// <param name="mask"><c>__m128i {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm256_mask_i64gather_epi32(__m128i src, int* base_addr, __m256i vindex, __m128i mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector128(src.UI32, (uint*)base_addr, vindex.SI64, mask.UI32, (byte)scale);
-
-		/// <summary>
-		/// Gather 64-bit integers from memory using 64-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VPGATHERQQ ymm, vm64x, ymm</c></remarks>
-		/// <param name="src"><c>__m256i {UI64}</c></param>
-		/// <param name="base_addr"><c>long {UI64}</c></param>
-		/// <param name="vindex"><c>__m256i {SI64}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_mask_i64gather_epi64(__m256i src, long* base_addr, __m256i vindex, __m256i mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector256(src.UI64, (ulong*)base_addr, vindex.SI64, mask.UI64, (byte)scale);
-
-		/// <summary>
-		/// Gather double-precision (64-bit) floating-point elements from memory using 64-bit indices. 64-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERQPD ymm, vm64x, ymm</c></remarks>
-		/// <param name="src"><c>__m256d {FP64}</c></param>
-		/// <param name="base_addr"><c>double {FP64}</c></param>
-		/// <param name="vindex"><c>__m256i {SI64}</c></param>
-		/// <param name="mask"><c>__m256d {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_mask_i64gather_pd(__m256d src, double* base_addr, __m256i vindex, __m256d mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector256(src.FP64, base_addr, vindex.SI64, mask.FP64, (byte)scale);
-
-		/// <summary>
-		/// Gather single-precision (32-bit) floating-point elements from memory using 64-bit indices. 32-bit elements are loaded from addresses starting at "base_addr" and offset by each 64-bit element in "vindex" (each index is scaled by the factor in "scale"). Gathered elements are merged into "dst" using "mask" (elements are copied from "src" when the highest bit is not set in the corresponding element). "scale" should be 1, 2, 4 or 8.
-		/// </summary>
-		/// <remarks><c>VGATHERQPS xmm, vm64y, xmm</c></remarks>
-		/// <param name="src"><c>__m128 {FP32}</c></param>
-		/// <param name="base_addr"><c>float {FP32}</c></param>
-		/// <param name="vindex"><c>__m256i {SI64}</c></param>
-		/// <param name="mask"><c>__m128 {MASK}</c></param>
-		/// <param name="scale"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm256_mask_i64gather_ps(__m128 src, float* base_addr, __m256i vindex, __m128 mask, int scale) => System.Runtime.Intrinsics.X86.Avx2.GatherMaskVector128(src.FP32, base_addr, vindex.SI64, mask.FP32, (byte)scale);
-
-		/// <summary>
-		/// Load packed 32-bit integers from memory into "dst" using "mask" (elements are zeroed out when the highest bit is not set in the corresponding element).
-		/// </summary>
-		/// <remarks><c>VPMASKMOVD ymm, ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>int {UI32}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_maskload_epi32(int* mem_addr, __m256i mask) => System.Runtime.Intrinsics.X86.Avx2.MaskLoad((uint*)mem_addr, mask.UI32);
-
-		/// <summary>
-		/// Load packed 64-bit integers from memory into "dst" using "mask" (elements are zeroed out when the highest bit is not set in the corresponding element).
-		/// </summary>
-		/// <remarks><c>VPMASKMOVQ ymm, ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>long {UI64}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_maskload_epi64(long* mem_addr, __m256i mask) => System.Runtime.Intrinsics.X86.Avx2.MaskLoad((ulong*)mem_addr, mask.UI64);
-
-		/// <summary>
-		/// Store packed 32-bit integers from "a" into memory using "mask" (elements are not stored when the highest bit is not set in the corresponding element).
-		/// </summary>
-		/// <remarks><c>VPMASKMOVD m256, ymm, ymm</c></remarks>
-		/// <param name="mem_addr"><c>int {UI32}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_maskstore_epi32(int* mem_addr, __m256i mask, __m256i a) => System.Runtime.Intrinsics.X86.Avx2.MaskStore((uint*)mem_addr, mask.UI32, a.UI32);
-
-		/// <summary>
-		/// Store packed 64-bit integers from "a" into memory using "mask" (elements are not stored when the highest bit is not set in the corresponding element).
-		/// </summary>
-		/// <remarks><c>VPMASKMOVQ m256, ymm, ymm</c></remarks>
-		/// <param name="mem_addr"><c>long {UI64}</c></param>
-		/// <param name="mask"><c>__m256i {MASK}</c></param>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm256_maskstore_epi64(long* mem_addr, __m256i mask, __m256i a) => System.Runtime.Intrinsics.X86.Avx2.MaskStore((ulong*)mem_addr, mask.UI64, a.UI64);
-
-		/// <summary>
-		/// Compare packed signed 16-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMAXSW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_max_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Max(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Compare packed signed 32-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMAXSD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <param name="b"><c>__m256i {SI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_max_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Max(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Compare packed signed 8-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMAXSB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI8}</c></param>
-		/// <param name="b"><c>__m256i {SI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_max_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Max(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Compare packed unsigned 16-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMAXUW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_max_epu16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Max(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Compare packed unsigned 32-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMAXUD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_max_epu32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Max(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Compare packed unsigned 8-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMAXUB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_max_epu8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Max(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Compare packed signed 16-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMINSW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_min_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Min(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Compare packed signed 32-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMINSD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <param name="b"><c>__m256i {SI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_min_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Min(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Compare packed signed 8-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMINSB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI8}</c></param>
-		/// <param name="b"><c>__m256i {SI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_min_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Min(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Compare packed unsigned 16-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMINUW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_min_epu16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Min(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Compare packed unsigned 32-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMINUD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_min_epu32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Min(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Compare packed unsigned 8-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>VPMINUB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_min_epu8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Min(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Create mask from the most significant bit of each 8-bit element in "a", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>VPMOVMSKB r32, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm256_movemask_epi8(__m256i a) => System.Runtime.Intrinsics.X86.Avx2.MoveMask(a.UI8);
-
-		/// <summary>
-		/// Compute the sum of absolute differences (SADs) of quadruplets of unsigned 8-bit integers in "a" compared to those in "b", and store the 16-bit results in "dst".	Eight SADs are performed for each 128-bit lane using one quadruplet from "b" and eight quadruplets from "a". One quadruplet is selected from "b" starting at on the offset specified in "imm8". Eight quadruplets are formed from sequential 8-bit integers selected from "a" starting at the offset specified in "imm8".
-		/// </summary>
-		/// <remarks><c>VMPSADBW ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_mpsadbw_epu8(__m256i a, __m256i b, int imm8) => System.Runtime.Intrinsics.X86.Avx2.MultipleSumAbsoluteDifferences(a.UI8, b.UI8, (byte)imm8);
-
-		/// <summary>
-		/// Multiply the low signed 32-bit integers from each packed 64-bit element in "a" and "b", and store the signed 64-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMULDQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <param name="b"><c>__m256i {SI32}</c></param>
-		/// <returns><c>__m256i dst {SI64}</c></returns>
-		public static __m256i _mm256_mul_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Multiply(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Multiply the low unsigned 32-bit integers from each packed 64-bit element in "a" and "b", and store the unsigned 64-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>VPMULUDQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_mul_epu32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Multiply(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Multiply the packed signed 16-bit integers in "a" and "b", producing intermediate 32-bit integers, and store the high 16 bits of the intermediate integers in "dst".
-		/// </summary>
-		/// <remarks><c>VPMULHW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_mulhi_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.MultiplyHigh(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Multiply the packed unsigned 16-bit integers in "a" and "b", producing intermediate 32-bit integers, and store the high 16 bits of the intermediate integers in "dst".
-		/// </summary>
-		/// <remarks><c>VPMULHUW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_mulhi_epu16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.MultiplyHigh(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Multiply packed signed 16-bit integers in "a" and "b", producing intermediate signed 32-bit integers. Truncate each intermediate integer to the 18 most significant bits, round by adding 1, and store bits [16:1] to "dst".
-		/// </summary>
-		/// <remarks><c>VPMULHRSW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_mulhrs_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.MultiplyHighRoundScale(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Multiply the packed signed 16-bit integers in "a" and "b", producing intermediate 32-bit integers, and store the low 16 bits of the intermediate integers in "dst".
-		/// </summary>
-		/// <remarks><c>VPMULLW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_mullo_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.MultiplyLow(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Multiply the packed signed 32-bit integers in "a" and "b", producing intermediate 64-bit integers, and store the low 32 bits of the intermediate integers in "dst".
-		/// </summary>
-		/// <remarks><c>VPMULLD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <param name="b"><c>__m256i {SI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_mullo_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.MultiplyLow(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Compute the bitwise OR of 256 bits (representing integer data) in "a" and "b", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>VPOR ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <param name="b"><c>__m256i {M256}</c></param>
-		/// <returns><c>__m256i dst {M256}</c></returns>
-		public static __m256i _mm256_or_si256(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Or(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Convert packed signed 16-bit integers from "a" and "b" to packed 8-bit integers using signed saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPACKSSWB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {SI8}</c></returns>
-		public static __m256i _mm256_packs_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.PackSignedSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Convert packed signed 32-bit integers from "a" and "b" to packed 16-bit integers using signed saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPACKSSDW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <param name="b"><c>__m256i {SI32}</c></param>
-		/// <returns><c>__m256i dst {SI16}</c></returns>
-		public static __m256i _mm256_packs_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.PackSignedSaturate(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Convert packed signed 16-bit integers from "a" and "b" to packed 8-bit integers using unsigned saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPACKUSWB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_packus_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.PackUnsignedSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Convert packed signed 32-bit integers from "a" and "b" to packed 16-bit integers using unsigned saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPACKUSDW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <param name="b"><c>__m256i {SI32}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_packus_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.PackUnsignedSaturate(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Shuffle 128-bits (composed of integer data) selected by "imm8" from "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERM2I128 ymm, ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <param name="b"><c>__m256i {M256}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {M256}</c></returns>
-		public static __m256i _mm256_permute2x128_si256(__m256i a, __m256i b, int imm8) => System.Runtime.Intrinsics.X86.Avx2.Permute2x128(a.SI8, b.SI8, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle 64-bit integers in "a" across lanes using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERMQ ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_permute4x64_epi64(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.Permute4x64(a.UI64, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle double-precision (64-bit) floating-point elements in "a" across lanes using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERMPD ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_permute4x64_pd(__m256d a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.Permute4x64(a.FP64, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle 32-bit integers in "a" across lanes using the corresponding index in "idx", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPERMD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="idx"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_permutevar8x32_epi32(__m256i a, __m256i idx) => System.Runtime.Intrinsics.X86.Avx2.PermuteVar8x32(a.UI32, idx.UI32);
-
-		/// <summary>
-		/// Shuffle single-precision (32-bit) floating-point elements in "a" across lanes using the corresponding index in "idx".
-		/// </summary>
-		/// <remarks><c>VPERMPS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="idx"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_permutevar8x32_ps(__m256 a, __m256i idx) => System.Runtime.Intrinsics.X86.Avx2.PermuteVar8x32(a.FP32, idx.SI32);
-
-		/// <summary>
-		/// Compute the absolute differences of packed unsigned 8-bit integers in "a" and "b", then horizontally sum each consecutive 8 differences to produce four unsigned 16-bit integers, and pack these unsigned 16-bit integers in the low 16 bits of 64-bit elements in "dst".
-		/// </summary>
-		/// <remarks><c>VPSADBW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_sad_epu8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.SumAbsoluteDifferences(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Shuffle 32-bit integers in "a" within 128-bit lanes using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSHUFD ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_shuffle_epi32(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.Shuffle(a.UI32, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle 8-bit integers in "a" within 128-bit lanes according to shuffle control mask in the corresponding 8-bit element of "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSHUFB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_shuffle_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Shuffle(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Shuffle 16-bit integers in the high 64 bits of 128-bit lanes of "a" using the control in "imm8". Store the results in the high 64 bits of 128-bit lanes of "dst", with the low 64 bits of 128-bit lanes being copied from from "a" to "dst".
-		/// </summary>
-		/// <remarks><c>VPSHUFHW ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_shufflehi_epi16(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShuffleHigh(a.UI16, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle 16-bit integers in the low 64 bits of 128-bit lanes of "a" using the control in "imm8". Store the results in the low 64 bits of 128-bit lanes of "dst", with the high 64 bits of 128-bit lanes being copied from from "a" to "dst".
-		/// </summary>
-		/// <remarks><c>VPSHUFLW ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_shufflelo_epi16(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShuffleLow(a.UI16, (byte)imm8);
-
-		/// <summary>
-		/// Negate packed signed 16-bit integers in "a" when the corresponding signed 16-bit integer in "b" is negative, and store the results in "dst". Element in "dst" are zeroed out when the corresponding element in "b" is zero.
-		/// </summary>
-		/// <remarks><c>VPSIGNW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_sign_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Sign(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Negate packed signed 32-bit integers in "a" when the corresponding signed 32-bit integer in "b" is negative, and store the results in "dst". Element in "dst" are zeroed out when the corresponding element in "b" is zero.
-		/// </summary>
-		/// <remarks><c>VPSIGND ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <param name="b"><c>__m256i {SI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_sign_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Sign(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Negate packed signed 8-bit integers in "a" when the corresponding signed 8-bit integer in "b" is negative, and store the results in "dst". Element in "dst" are zeroed out when the corresponding element in "b" is zero.
-		/// </summary>
-		/// <remarks><c>VPSIGNB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI8}</c></param>
-		/// <param name="b"><c>__m256i {SI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_sign_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Sign(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Shift packed 16-bit integers in "a" left by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSLLW ymm, ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="count"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_sll_epi16(__m256i a, __m128i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftLeftLogical(a.UI16, count.UI16);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" left by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSLLD ymm, ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="count"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_sll_epi32(__m256i a, __m128i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftLeftLogical(a.UI32, count.UI32);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" left by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSLLQ ymm, ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="count"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_sll_epi64(__m256i a, __m128i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftLeftLogical(a.UI64, count.UI64);
-
-		/// <summary>
-		/// Shift packed 16-bit integers in "a" left by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSLLW ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_slli_epi16(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShiftLeftLogical(a.UI16, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" left by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSLLD ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_slli_epi32(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShiftLeftLogical(a.UI32, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" left by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSLLQ ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_slli_epi64(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShiftLeftLogical(a.UI64, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" left by the amount specified by the corresponding element in "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSLLVD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="count"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_sllv_epi32(__m256i a, __m256i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftLeftLogicalVariable(a.UI32, count.UI32);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" left by the amount specified by the corresponding element in "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSLLVQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="count"><c>__m256i {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_sllv_epi64(__m256i a, __m256i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftLeftLogicalVariable(a.UI64, count.UI64);
-
-		/// <summary>
-		/// Shift packed 16-bit integers in "a" right by "imm8" while shifting in sign bits, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRAW ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_srai_epi16(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightArithmetic(a.SI16, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" right by "imm8" while shifting in sign bits, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRAD ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_srai_epi32(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightArithmetic(a.SI32, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" right by the amount specified by the corresponding element in "count" while shifting in sign bits, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRAVD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI32}</c></param>
-		/// <param name="count"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_srav_epi32(__m256i a, __m256i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightArithmeticVariable(a.SI32, count.UI32);
-
-		/// <summary>
-		/// Shift packed 16-bit integers in "a" right by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRLW ymm, ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="count"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_srl_epi16(__m256i a, __m128i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightLogical(a.UI16, count.UI16);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" right by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRLD ymm, ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="count"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_srl_epi32(__m256i a, __m128i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightLogical(a.UI32, count.UI32);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" right by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRLQ ymm, ymm, xmm</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="count"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_srl_epi64(__m256i a, __m128i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightLogical(a.UI64, count.UI64);
-
-		/// <summary>
-		/// Shift packed 16-bit integers in "a" right by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRLW ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_srli_epi16(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightLogical(a.UI16, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" right by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRLD ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_srli_epi32(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightLogical(a.UI32, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" right by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRLQ ymm, ymm, imm8</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_srli_epi64(__m256i a, int imm8) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightLogical(a.UI64, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" right by the amount specified by the corresponding element in "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRLVD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="count"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_srlv_epi32(__m256i a, __m256i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightLogicalVariable(a.UI32, count.UI32);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" right by the amount specified by the corresponding element in "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSRLVQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="count"><c>__m256i {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_srlv_epi64(__m256i a, __m256i count) => System.Runtime.Intrinsics.X86.Avx2.ShiftRightLogicalVariable(a.UI64, count.UI64);
-
-		/// <summary>
-		/// Load 256-bits of integer data from memory into "dst" using a non-temporal memory hint.	"mem_addr" must be aligned on a 32-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>VMOVNTDQA ymm, m256</c></remarks>
-		/// <param name="mem_addr"><c>__m256i {M256}</c></param>
-		/// <returns><c>__m256i dst {M256}</c></returns>
-		public static __m256i _mm256_stream_load_si256(__m256i* mem_addr) => System.Runtime.Intrinsics.X86.Avx2.LoadAlignedVector256NonTemporal((sbyte*)mem_addr);
-
-		/// <summary>
-		/// Subtract packed 16-bit integers in "b" from packed 16-bit integers in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSUBW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_sub_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Subtract(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Subtract packed 32-bit integers in "b" from packed 32-bit integers in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSUBD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_sub_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Subtract(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Subtract packed 64-bit integers in "b" from packed 64-bit integers in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSUBQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="b"><c>__m256i {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_sub_epi64(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Subtract(a.UI64, b.UI64);
-
-		/// <summary>
-		/// Subtract packed 8-bit integers in "b" from packed 8-bit integers in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSUBB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_sub_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Subtract(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Subtract packed signed 16-bit integers in "b" from packed 16-bit integers in "a" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSUBSW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI16}</c></param>
-		/// <param name="b"><c>__m256i {SI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_subs_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.SubtractSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Subtract packed signed 8-bit integers in "b" from packed 8-bit integers in "a" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSUBSB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {SI8}</c></param>
-		/// <param name="b"><c>__m256i {SI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_subs_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.SubtractSaturate(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Subtract packed unsigned 16-bit integers in "b" from packed unsigned 16-bit integers in "a" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSUBUSW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_subs_epu16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.SubtractSaturate(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Subtract packed unsigned 8-bit integers in "b" from packed unsigned 8-bit integers in "a" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPSUBUSB ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_subs_epu8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.SubtractSaturate(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Unpack and interleave 16-bit integers from the high half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPUNPCKHWD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_unpackhi_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.UnpackHigh(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Unpack and interleave 32-bit integers from the high half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPUNPCKHDQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_unpackhi_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.UnpackHigh(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Unpack and interleave 64-bit integers from the high half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPUNPCKHQDQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="b"><c>__m256i {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_unpackhi_epi64(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.UnpackHigh(a.UI64, b.UI64);
-
-		/// <summary>
-		/// Unpack and interleave 8-bit integers from the high half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPUNPCKHBW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_unpackhi_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.UnpackHigh(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Unpack and interleave 16-bit integers from the low half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPUNPCKLWD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI16}</c></param>
-		/// <param name="b"><c>__m256i {UI16}</c></param>
-		/// <returns><c>__m256i dst {UI16}</c></returns>
-		public static __m256i _mm256_unpacklo_epi16(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.UnpackLow(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Unpack and interleave 32-bit integers from the low half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPUNPCKLDQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI32}</c></param>
-		/// <param name="b"><c>__m256i {UI32}</c></param>
-		/// <returns><c>__m256i dst {UI32}</c></returns>
-		public static __m256i _mm256_unpacklo_epi32(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.UnpackLow(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Unpack and interleave 64-bit integers from the low half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPUNPCKLQDQ ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI64}</c></param>
-		/// <param name="b"><c>__m256i {UI64}</c></param>
-		/// <returns><c>__m256i dst {UI64}</c></returns>
-		public static __m256i _mm256_unpacklo_epi64(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.UnpackLow(a.UI64, b.UI64);
-
-		/// <summary>
-		/// Unpack and interleave 8-bit integers from the low half of each 128-bit lane in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VPUNPCKLBW ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {UI8}</c></param>
-		/// <param name="b"><c>__m256i {UI8}</c></param>
-		/// <returns><c>__m256i dst {UI8}</c></returns>
-		public static __m256i _mm256_unpacklo_epi8(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.UnpackLow(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Compute the bitwise XOR of 256 bits (representing integer data) in "a" and "b", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>VPXOR ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256i {M256}</c></param>
-		/// <param name="b"><c>__m256i {M256}</c></param>
-		/// <returns><c>__m256i dst {M256}</c></returns>
-		public static __m256i _mm256_xor_si256(__m256i a, __m256i b) => System.Runtime.Intrinsics.X86.Avx2.Xor(a.SI8, b.SI8);
-
-	}
-}
diff --git a/src/External/RawIntrinsics/FMA.cs b/src/External/RawIntrinsics/FMA.cs
deleted file mode 100644
index acad284..0000000
--- a/src/External/RawIntrinsics/FMA.cs
+++ /dev/null
@@ -1,326 +0,0 @@
-namespace RawIntrinsics
-{
-	public static unsafe partial class FMA
-	{
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", add the intermediate result to packed elements in "c", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMADD132PD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="c"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_fmadd_pd(__m128d a, __m128d b, __m128d c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAdd(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", add the intermediate result to packed elements in "c", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMADD132PS xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="c"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_fmadd_ps(__m128 a, __m128 b, __m128 c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAdd(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply the lower double-precision (64-bit) floating-point elements in "a" and "b", and add the intermediate result to the lower element in "c". Store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>VFMADD132SD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="c"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_fmadd_sd(__m128d a, __m128d b, __m128d c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddScalar(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply the lower single-precision (32-bit) floating-point elements in "a" and "b", and add the intermediate result to the lower element in "c". Store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>VFMADD132SS xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="c"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_fmadd_ss(__m128 a, __m128 b, __m128 c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddScalar(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", alternatively add and subtract packed elements in "c" to/from the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMADDSUB132PD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="c"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_fmaddsub_pd(__m128d a, __m128d b, __m128d c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddSubtract(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", alternatively add and subtract packed elements in "c" to/from the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMADDSUB132PS xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="c"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_fmaddsub_ps(__m128 a, __m128 b, __m128 c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddSubtract(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", subtract packed elements in "c" from the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMSUB132PD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="c"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_fmsub_pd(__m128d a, __m128d b, __m128d c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtract(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", subtract packed elements in "c" from the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMSUB132PS xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="c"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_fmsub_ps(__m128 a, __m128 b, __m128 c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtract(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply the lower double-precision (64-bit) floating-point elements in "a" and "b", and subtract the lower element in "c" from the intermediate result. Store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>VFMSUB132SD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="c"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_fmsub_sd(__m128d a, __m128d b, __m128d c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractScalar(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply the lower single-precision (32-bit) floating-point elements in "a" and "b", and subtract the lower element in "c" from the intermediate result. Store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>VFMSUB132SS xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="c"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_fmsub_ss(__m128 a, __m128 b, __m128 c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractScalar(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", alternatively subtract and add packed elements in "c" from/to the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMSUBADD132PD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="c"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_fmsubadd_pd(__m128d a, __m128d b, __m128d c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractAdd(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", alternatively subtract and add packed elements in "c" from/to the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMSUBADD132PS xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="c"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_fmsubadd_ps(__m128 a, __m128 b, __m128 c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractAdd(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", add the negated intermediate result to packed elements in "c", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFNMADD132PD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="c"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_fnmadd_pd(__m128d a, __m128d b, __m128d c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddNegated(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", add the negated intermediate result to packed elements in "c", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFNMADD132PS xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="c"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_fnmadd_ps(__m128 a, __m128 b, __m128 c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddNegated(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply the lower double-precision (64-bit) floating-point elements in "a" and "b", and add the negated intermediate result to the lower element in "c". Store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>VFNMADD132SD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="c"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_fnmadd_sd(__m128d a, __m128d b, __m128d c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddNegatedScalar(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply the lower single-precision (32-bit) floating-point elements in "a" and "b", and add the negated intermediate result to the lower element in "c". Store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>VFNMADD132SS xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="c"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_fnmadd_ss(__m128 a, __m128 b, __m128 c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddNegatedScalar(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", subtract packed elements in "c" from the negated intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFNMSUB132PD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="c"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_fnmsub_pd(__m128d a, __m128d b, __m128d c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractNegated(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", subtract packed elements in "c" from the negated intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFNMSUB132PS xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="c"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_fnmsub_ps(__m128 a, __m128 b, __m128 c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractNegated(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply the lower double-precision (64-bit) floating-point elements in "a" and "b", and subtract the lower element in "c" from the negated intermediate result. Store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>VFNMSUB132SD xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="c"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_fnmsub_sd(__m128d a, __m128d b, __m128d c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractNegatedScalar(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply the lower single-precision (32-bit) floating-point elements in "a" and "b", and subtract the lower element in "c" from the negated intermediate result. Store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>VFNMSUB132SS xmm, xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="c"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_fnmsub_ss(__m128 a, __m128 b, __m128 c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractNegatedScalar(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", add the intermediate result to packed elements in "c", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMADD132PD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <param name="c"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_fmadd_pd(__m256d a, __m256d b, __m256d c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAdd(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", add the intermediate result to packed elements in "c", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMADD132PS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="c"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_fmadd_ps(__m256 a, __m256 b, __m256 c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAdd(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", alternatively add and subtract packed elements in "c" to/from the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMADDSUB132PD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <param name="c"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_fmaddsub_pd(__m256d a, __m256d b, __m256d c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddSubtract(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", alternatively add and subtract packed elements in "c" to/from the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMADDSUB132PS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="c"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_fmaddsub_ps(__m256 a, __m256 b, __m256 c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddSubtract(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", subtract packed elements in "c" from the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMSUB132PD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <param name="c"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_fmsub_pd(__m256d a, __m256d b, __m256d c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtract(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", subtract packed elements in "c" from the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMSUB132PS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="c"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_fmsub_ps(__m256 a, __m256 b, __m256 c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtract(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", alternatively subtract and add packed elements in "c" from/to the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMSUBADD132PD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <param name="c"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_fmsubadd_pd(__m256d a, __m256d b, __m256d c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractAdd(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", alternatively subtract and add packed elements in "c" from/to the intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFMSUBADD132PS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="c"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_fmsubadd_ps(__m256 a, __m256 b, __m256 c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractAdd(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", add the negated intermediate result to packed elements in "c", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFNMADD132PD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <param name="c"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_fnmadd_pd(__m256d a, __m256d b, __m256d c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddNegated(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", add the negated intermediate result to packed elements in "c", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFNMADD132PS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="c"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_fnmadd_ps(__m256 a, __m256 b, __m256 c) => System.Runtime.Intrinsics.X86.Fma.MultiplyAddNegated(a.FP32, b.FP32, c.FP32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", subtract packed elements in "c" from the negated intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFNMSUB132PD ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256d {FP64}</c></param>
-		/// <param name="b"><c>__m256d {FP64}</c></param>
-		/// <param name="c"><c>__m256d {FP64}</c></param>
-		/// <returns><c>__m256d dst {FP64}</c></returns>
-		public static __m256d _mm256_fnmsub_pd(__m256d a, __m256d b, __m256d c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractNegated(a.FP64, b.FP64, c.FP64);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", subtract packed elements in "c" from the negated intermediate result, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>VFNMSUB132PS ymm, ymm, ymm</c></remarks>
-		/// <param name="a"><c>__m256 {FP32}</c></param>
-		/// <param name="b"><c>__m256 {FP32}</c></param>
-		/// <param name="c"><c>__m256 {FP32}</c></param>
-		/// <returns><c>__m256 dst {FP32}</c></returns>
-		public static __m256 _mm256_fnmsub_ps(__m256 a, __m256 b, __m256 c) => System.Runtime.Intrinsics.X86.Fma.MultiplySubtractNegated(a.FP32, b.FP32, c.FP32);
-
-	}
-}
diff --git a/src/External/RawIntrinsics/MMX.ManuallyAdded.cs b/src/External/RawIntrinsics/MMX.ManuallyAdded.cs
deleted file mode 100644
index c1a5938..0000000
--- a/src/External/RawIntrinsics/MMX.ManuallyAdded.cs
+++ /dev/null
@@ -1,11 +0,0 @@
-﻿namespace RawIntrinsics
-{
-	public static partial class MMX
-	{
-		/// <summary>
-		/// Return vector of type __m64 with all elements set to zero.
-		/// </summary>
-		/// <returns><c>__m64 dst {FP32}</c></returns>
-		public static __m64 _mm_setzero_si64() => System.Runtime.Intrinsics.Vector64<float>.Zero;
-	}
-}
\ No newline at end of file
diff --git a/src/External/RawIntrinsics/MMX.cs b/src/External/RawIntrinsics/MMX.cs
deleted file mode 100644
index b8071c7..0000000
--- a/src/External/RawIntrinsics/MMX.cs
+++ /dev/null
@@ -1,65 +0,0 @@
-namespace RawIntrinsics
-{
-	public static unsafe partial class MMX
-	{
-		/// <summary>
-		/// Broadcast 16-bit integer "a" to all all elements of "dst".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>short {UI16}</c></param>
-		/// <returns><c>__m64 dst {FP32}</c></returns>
-		public static __m64 _mm_set1_pi16(short a) => System.Runtime.Intrinsics.Vector64.Create((ushort)a);
-
-		/// <summary>
-		/// Broadcast 32-bit integer "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>int {UI32}</c></param>
-		/// <returns><c>__m64 dst {FP32}</c></returns>
-		public static __m64 _mm_set1_pi32(int a) => System.Runtime.Intrinsics.Vector64.Create((uint)a);
-
-		/// <summary>
-		/// Broadcast 8-bit integer "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>byte {UI8}</c></param>
-		/// <returns><c>__m64 dst {FP32}</c></returns>
-		public static __m64 _mm_set1_pi8(byte a) => System.Runtime.Intrinsics.Vector64.Create(a);
-
-		/// <summary>
-		/// Set packed 16-bit integers in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e3"><c>short {UI16}</c></param>
-		/// <param name="e2"><c>short {UI16}</c></param>
-		/// <param name="e1"><c>short {UI16}</c></param>
-		/// <param name="e0"><c>short {UI16}</c></param>
-		/// <returns><c>__m64 dst {FP32}</c></returns>
-		public static __m64 _mm_setr_pi16(short e3, short e2, short e1, short e0) => System.Runtime.Intrinsics.Vector64.Create((ushort)e3, (ushort)e2, (ushort)e1, (ushort)e0);
-
-		/// <summary>
-		/// Set packed 32-bit integers in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e1"><c>int {UI32}</c></param>
-		/// <param name="e0"><c>int {UI32}</c></param>
-		/// <returns><c>__m64 dst {FP32}</c></returns>
-		public static __m64 _mm_setr_pi32(int e1, int e0) => System.Runtime.Intrinsics.Vector64.Create((uint)e1, (uint)e0);
-
-		/// <summary>
-		/// Set packed 8-bit integers in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e7"><c>byte {UI8}</c></param>
-		/// <param name="e6"><c>byte {UI8}</c></param>
-		/// <param name="e5"><c>byte {UI8}</c></param>
-		/// <param name="e4"><c>byte {UI8}</c></param>
-		/// <param name="e3"><c>byte {UI8}</c></param>
-		/// <param name="e2"><c>byte {UI8}</c></param>
-		/// <param name="e1"><c>byte {UI8}</c></param>
-		/// <param name="e0"><c>byte {UI8}</c></param>
-		/// <returns><c>__m64 dst {FP32}</c></returns>
-		public static __m64 _mm_setr_pi8(byte e7, byte e6, byte e5, byte e4, byte e3, byte e2, byte e1, byte e0) => System.Runtime.Intrinsics.Vector64.Create(e7, e6, e5, e4, e3, e2, e1, e0);
-
-	}
-}
diff --git a/src/External/RawIntrinsics/Other.cs b/src/External/RawIntrinsics/Other.cs
deleted file mode 100644
index 2d53527..0000000
--- a/src/External/RawIntrinsics/Other.cs
+++ /dev/null
@@ -1,101 +0,0 @@
-namespace RawIntrinsics
-{
-	public static unsafe partial class Other
-	{
-		/// <summary>
-		/// Perform one round of an AES decryption flow on data (state) in "a" using the round key in "RoundKey", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>AESDEC xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="RoundKey"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_aesdec_si128(__m128i a, __m128i RoundKey) => System.Runtime.Intrinsics.X86.Aes.Decrypt(a.UI8, RoundKey.UI8);
-
-		/// <summary>
-		/// Perform the last round of an AES decryption flow on data (state) in "a" using the round key in "RoundKey", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>AESDECLAST xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="RoundKey"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_aesdeclast_si128(__m128i a, __m128i RoundKey) => System.Runtime.Intrinsics.X86.Aes.DecryptLast(a.UI8, RoundKey.UI8);
-
-		/// <summary>
-		/// Perform one round of an AES encryption flow on data (state) in "a" using the round key in "RoundKey", and store the result in "dst"."
-		/// </summary>
-		/// <remarks><c>AESENC xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="RoundKey"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_aesenc_si128(__m128i a, __m128i RoundKey) => System.Runtime.Intrinsics.X86.Aes.Encrypt(a.UI8, RoundKey.UI8);
-
-		/// <summary>
-		/// Perform the last round of an AES encryption flow on data (state) in "a" using the round key in "RoundKey", and store the result in "dst"."
-		/// </summary>
-		/// <remarks><c>AESENCLAST xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="RoundKey"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_aesenclast_si128(__m128i a, __m128i RoundKey) => System.Runtime.Intrinsics.X86.Aes.EncryptLast(a.UI8, RoundKey.UI8);
-
-		/// <summary>
-		/// Perform the InvMixColumns transformation on "a" and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>AESIMC xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_aesimc_si128(__m128i a) => System.Runtime.Intrinsics.X86.Aes.InverseMixColumns(a.UI8);
-
-		/// <summary>
-		/// Assist in expanding the AES cipher key by computing steps towards generating a round key for encryption cipher using data from "a" and an 8-bit round constant specified in "imm8", and store the result in "dst"."
-		/// </summary>
-		/// <remarks><c>AESKEYGENASSIST xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_aeskeygenassist_si128(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Aes.KeygenAssist(a.UI8, (byte)imm8);
-
-		/// <summary>
-		/// Perform a carry-less multiplication of two 64-bit integers, selected from "a" and "b" according to "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PCLMULQDQ xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="b"><c>__m128i {M128}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_clmulepi64_si128(__m128i a, __m128i b, int imm8) => System.Runtime.Intrinsics.X86.Pclmulqdq.CarrylessMultiply(a.SI64, b.SI64, (byte)imm8);
-
-		/// <summary>
-		/// Count the number of bits set to 1 in unsigned 32-bit integer "a", and return that count in "dst".
-		/// </summary>
-		/// <remarks><c>POPCNT r32, r32</c></remarks>
-		/// <param name="a"><c>int {UI32}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm_popcnt_u32(int a) => (int)System.Runtime.Intrinsics.X86.Popcnt.PopCount((uint)a);
-
-		/// <summary>
-		/// Count the number of bits set to 1 in unsigned 64-bit integer "a", and return that count in "dst".
-		/// </summary>
-		/// <remarks><c>POPCNT r64, r64</c></remarks>
-		/// <param name="a"><c>long {UI64}</c></param>
-		/// <returns><c>long dst {UI64}</c></returns>
-		public static long _mm_popcnt_u64(long a) => (long)System.Runtime.Intrinsics.X86.Popcnt.X64.PopCount((ulong)a);
-
-		/// <summary>
-		/// Count the number of trailing zero bits in unsigned 32-bit integer "a", and return that count in "dst".
-		/// </summary>
-		/// <remarks><c>TZCNT r32, r32</c></remarks>
-		/// <param name="a"><c>int {UI32}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm_tzcnt_32(int a) => (int)System.Runtime.Intrinsics.X86.Bmi1.TrailingZeroCount((uint)a);
-
-		/// <summary>
-		/// Count the number of trailing zero bits in unsigned 64-bit integer "a", and return that count in "dst".
-		/// </summary>
-		/// <remarks><c>TZCNT r64, r64</c></remarks>
-		/// <param name="a"><c>long {UI64}</c></param>
-		/// <returns><c>long dst {UI64}</c></returns>
-		public static long _mm_tzcnt_64(long a) => (long)System.Runtime.Intrinsics.X86.Bmi1.X64.TrailingZeroCount((ulong)a);
-
-	}
-}
diff --git a/src/External/RawIntrinsics/RawIntrinsics.csproj b/src/External/RawIntrinsics/RawIntrinsics.csproj
deleted file mode 100644
index 2e66377..0000000
--- a/src/External/RawIntrinsics/RawIntrinsics.csproj
+++ /dev/null
@@ -1,8 +0,0 @@
-<Project Sdk="Microsoft.NET.Sdk">
-
-    <PropertyGroup>
-        <TargetFramework>net7.0</TargetFramework>
-        <AllowUnsafeBlocks>true</AllowUnsafeBlocks>
-    </PropertyGroup>
-
-</Project>
diff --git a/src/External/RawIntrinsics/SSE.ManuallyAdded.cs b/src/External/RawIntrinsics/SSE.ManuallyAdded.cs
deleted file mode 100644
index 09d9083..0000000
--- a/src/External/RawIntrinsics/SSE.ManuallyAdded.cs
+++ /dev/null
@@ -1,11 +0,0 @@
-﻿namespace RawIntrinsics
-{
-	public static partial class SSE
-	{
-		/// <summary>
-		/// Return vector of type __m128 with all elements set to zero.
-		/// </summary>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_setzero_ps() => System.Runtime.Intrinsics.Vector128<float>.Zero;
-	}
-}
\ No newline at end of file
diff --git a/src/External/RawIntrinsics/SSE.cs b/src/External/RawIntrinsics/SSE.cs
deleted file mode 100644
index e7c090c..0000000
--- a/src/External/RawIntrinsics/SSE.cs
+++ /dev/null
@@ -1,766 +0,0 @@
-namespace RawIntrinsics
-{
-	public static unsafe partial class SSE
-	{
-		/// <summary>
-		/// Add packed single-precision (32-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>ADDPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_add_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.Add(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Add the lower single-precision (32-bit) floating-point element in "a" and "b", store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>ADDSS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_add_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.AddScalar(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise AND of packed single-precision (32-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>ANDPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_and_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.And(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise NOT of packed single-precision (32-bit) floating-point elements in "a" and then AND with "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>ANDNPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_andnot_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.AndNot(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" for equality, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpeq_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" for equality, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpeq_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" for greater-than-or-equal, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpge_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareGreaterThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" for greater-than-or-equal, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpge_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarGreaterThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" for greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpgt_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareGreaterThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" for greater-than, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpgt_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarGreaterThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" for less-than-or-equal, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmple_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareLessThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" for less-than-or-equal, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmple_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarLessThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" for less-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmplt_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareLessThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" for less-than, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmplt_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarLessThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" for not-equal, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpneq_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareNotEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" for not-equal, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpneq_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarNotEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" for not-greater-than-or-equal, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpnge_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareNotGreaterThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" for not-greater-than-or-equal, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpnge_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarNotGreaterThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" for not-greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpngt_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareNotGreaterThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" for not-greater-than, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpngt_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarNotGreaterThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" for not-less-than-or-equal, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpnle_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareNotLessThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" for not-less-than-or-equal, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpnle_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarNotLessThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" for not-less-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpnlt_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareNotLessThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" for not-less-than, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpnlt_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarNotLessThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" to see if neither is NaN, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpord_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareOrdered(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" to see if neither is NaN, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpord_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarOrdered(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b" to see if either is NaN, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpunord_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareUnordered(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b" to see if either is NaN, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cmpunord_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarUnordered(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for equality, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comieq_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarOrderedEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for greater-than-or-equal, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comige_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarOrderedGreaterThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for greater-than, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comigt_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarOrderedGreaterThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for less-than-or-equal, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comile_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarOrderedLessThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for less-than, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comilt_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarOrderedLessThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for not-equal, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comineq_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarOrderedNotEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Convert the signed 32-bit integer "b" to a single-precision (32-bit) floating-point element, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CVTSI2SS xmm, r32</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>int {SI32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cvtsi32_ss(__m128 a, int b) => System.Runtime.Intrinsics.X86.Sse.ConvertScalarToVector128Single(a.FP32, b);
-
-		/// <summary>
-		/// Convert the signed 64-bit integer "b" to a single-precision (32-bit) floating-point element, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CVTSI2SS xmm, r64</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>long {SI64}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cvtsi64_ss(__m128 a, long b) => System.Runtime.Intrinsics.X86.Sse.X64.ConvertScalarToVector128Single(a.FP32, b);
-
-		/// <summary>
-		/// Convert the lower single-precision (32-bit) floating-point element in "a" to a 32-bit integer, and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>CVTSS2SI r32, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm_cvtss_si32(__m128 a) => System.Runtime.Intrinsics.X86.Sse.ConvertToInt32(a.FP32);
-
-		/// <summary>
-		/// Convert the lower single-precision (32-bit) floating-point element in "a" to a 64-bit integer, and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>CVTSS2SI r64, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>long dst {UI64}</c></returns>
-		public static long _mm_cvtss_si64(__m128 a) => System.Runtime.Intrinsics.X86.Sse.X64.ConvertToInt64(a.FP32);
-
-		/// <summary>
-		/// Convert the lower single-precision (32-bit) floating-point element in "a" to a 32-bit integer with truncation, and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>CVTTSS2SI r32, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm_cvttss_si32(__m128 a) => System.Runtime.Intrinsics.X86.Sse.ConvertToInt32WithTruncation(a.FP32);
-
-		/// <summary>
-		/// Convert the lower single-precision (32-bit) floating-point element in "a" to a 64-bit integer with truncation, and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>CVTTSS2SI r64, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>long dst {UI64}</c></returns>
-		public static long _mm_cvttss_si64(__m128 a) => System.Runtime.Intrinsics.X86.Sse.X64.ConvertToInt64WithTruncation(a.FP32);
-
-		/// <summary>
-		/// Divide packed single-precision (32-bit) floating-point elements in "a" by packed elements in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>DIVPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_div_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.Divide(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Divide the lower single-precision (32-bit) floating-point element in "a" by the lower single-precision (32-bit) floating-point element in "b", store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>DIVSS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_div_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.DivideScalar(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Load 128-bits (composed of 4 packed single-precision (32-bit) floating-point elements) from memory into "dst".	"mem_addr" must be aligned on a 16-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>MOVAPS xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_load_ps(float* mem_addr) => System.Runtime.Intrinsics.X86.Sse.LoadAlignedVector128(mem_addr);
-
-		/// <summary>
-		/// Load a single-precision (32-bit) floating-point element from memory into the lower of "dst", and zero the upper 3 elements. "mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVSS xmm, m32</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_load_ss(float* mem_addr) => System.Runtime.Intrinsics.X86.Sse.LoadScalarVector128(mem_addr);
-
-		/// <summary>
-		/// Load 2 single-precision (32-bit) floating-point elements from memory into the upper 2 elements of "dst", and copy the lower 2 elements from "a" to "dst". "mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVHPS xmm, m64</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="mem_addr"><c>__m64 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_loadh_pi(__m128 a, __m64* mem_addr) => System.Runtime.Intrinsics.X86.Sse.LoadHigh(a.FP32, (float*)mem_addr);
-
-		/// <summary>
-		/// Load 2 single-precision (32-bit) floating-point elements from memory into the lower 2 elements of "dst", and copy the upper 2 elements from "a" to "dst". "mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVLPS xmm, m64</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="mem_addr"><c>__m64 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_loadl_pi(__m128 a, __m64* mem_addr) => System.Runtime.Intrinsics.X86.Sse.LoadLow(a.FP32, (float*)mem_addr);
-
-		/// <summary>
-		/// Load 128-bits (composed of 4 packed single-precision (32-bit) floating-point elements) from memory into "dst".	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVUPS xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_loadu_ps(float* mem_addr) => System.Runtime.Intrinsics.X86.Sse.LoadVector128(mem_addr);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>MAXPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_max_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.Max(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b", store the maximum value in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>MAXSS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_max_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.MaxScalar(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare packed single-precision (32-bit) floating-point elements in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>MINPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_min_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.Min(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point elements in "a" and "b", store the minimum value in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>MINSS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_min_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.MinScalar(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Move the lower single-precision (32-bit) floating-point element from "b" to the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>MOVSS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_move_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.MoveScalar(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Move the upper 2 single-precision (32-bit) floating-point elements from "b" to the lower 2 elements of "dst", and copy the upper 2 elements from "a" to the upper 2 elements of "dst".
-		/// </summary>
-		/// <remarks><c>MOVHLPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_movehl_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.MoveHighToLow(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Move the lower 2 single-precision (32-bit) floating-point elements from "b" to the upper 2 elements of "dst", and copy the lower 2 elements from "a" to the lower 2 elements of "dst".
-		/// </summary>
-		/// <remarks><c>MOVLHPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_movelh_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.MoveLowToHigh(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Set each bit of mask "dst" based on the most significant bit of the corresponding packed single-precision (32-bit) floating-point element in "a".
-		/// </summary>
-		/// <remarks><c>MOVMSKPS r32, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm_movemask_ps(__m128 a) => System.Runtime.Intrinsics.X86.Sse.MoveMask(a.FP32);
-
-		/// <summary>
-		/// Multiply packed single-precision (32-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>MULPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_mul_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.Multiply(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Multiply the lower single-precision (32-bit) floating-point element in "a" and "b", store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>MULSS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_mul_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.MultiplyScalar(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise OR of packed single-precision (32-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>ORPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_or_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.Or(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Fetch the line of data from memory that contains address "p" to a location in the cache heirarchy specified by the locality hint "i".
-		/// </summary>
-		/// <remarks><c>PREFETCHNTA m8</c></remarks>
-		/// <param name="p"><c>byte {UI8}</c></param>
-		/// <param name="i"><c>int {IMM}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_prefetch(byte* p, int i) => System.Runtime.Intrinsics.X86.Sse.Prefetch0((void*)p);
-
-		/// <summary>
-		/// Compute the approximate reciprocal of packed single-precision (32-bit) floating-point elements in "a", and store the results in "dst". The maximum relative error for this approximation is less than 1.5*2^-12.
-		/// </summary>
-		/// <remarks><c>RCPPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_rcp_ps(__m128 a) => System.Runtime.Intrinsics.X86.Sse.Reciprocal(a.FP32);
-
-		/// <summary>
-		/// Compute the approximate reciprocal of the lower single-precision (32-bit) floating-point element in "a", store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst". The maximum relative error for this approximation is less than 1.5*2^-12.
-		/// </summary>
-		/// <remarks><c>RCPSS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_rcp_ss(__m128 a) => System.Runtime.Intrinsics.X86.Sse.ReciprocalScalar(a.FP32);
-
-		/// <summary>
-		/// Compute the approximate reciprocal square root of packed single-precision (32-bit) floating-point elements in "a", and store the results in "dst". The maximum relative error for this approximation is less than 1.5*2^-12.
-		/// </summary>
-		/// <remarks><c>RSQRTPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_rsqrt_ps(__m128 a) => System.Runtime.Intrinsics.X86.Sse.ReciprocalSqrt(a.FP32);
-
-		/// <summary>
-		/// Compute the approximate reciprocal square root of the lower single-precision (32-bit) floating-point element in "a", store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst". The maximum relative error for this approximation is less than 1.5*2^-12.
-		/// </summary>
-		/// <remarks><c>RSQRTSS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_rsqrt_ss(__m128 a) => System.Runtime.Intrinsics.X86.Sse.ReciprocalSqrtScalar(a.FP32);
-
-		/// <summary>
-		/// Broadcast single-precision (32-bit) floating-point value "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>float {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_set1_ps(float a) => System.Runtime.Intrinsics.Vector128.Create(a);
-
-		/// <summary>
-		/// Set packed single-precision (32-bit) floating-point elements in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e3"><c>float {FP32}</c></param>
-		/// <param name="e2"><c>float {FP32}</c></param>
-		/// <param name="e1"><c>float {FP32}</c></param>
-		/// <param name="e0"><c>float {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_setr_ps(float e3, float e2, float e1, float e0) => System.Runtime.Intrinsics.Vector128.Create(e3, e2, e1, e0);
-
-		/// <summary>
-		/// Perform a serializing operation on all store-to-memory instructions that were issued prior to this instruction. Guarantees that every store instruction that precedes, in program order, is globally visible before any store instruction which follows the fence in program order.
-		/// </summary>
-		/// <remarks><c>SFENCE </c></remarks>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_sfence() => System.Runtime.Intrinsics.X86.Sse.StoreFence();
-
-		/// <summary>
-		/// Shuffle single-precision (32-bit) floating-point elements in "a" using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>SHUFPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_shuffle_ps(__m128 a, __m128 b, int imm8) => System.Runtime.Intrinsics.X86.Sse.Shuffle(a.FP32, b.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Compute the square root of packed single-precision (32-bit) floating-point elements in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>SQRTPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_sqrt_ps(__m128 a) => System.Runtime.Intrinsics.X86.Sse.Sqrt(a.FP32);
-
-		/// <summary>
-		/// Compute the square root of the lower single-precision (32-bit) floating-point element in "a", store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>SQRTSS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_sqrt_ss(__m128 a) => System.Runtime.Intrinsics.X86.Sse.SqrtScalar(a.FP32);
-
-		/// <summary>
-		/// Store 128-bits (composed of 4 packed single-precision (32-bit) floating-point elements) from "a" into memory.	"mem_addr" must be aligned on a 16-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>MOVAPS m128, xmm</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_store_ps(float* mem_addr, __m128 a) => System.Runtime.Intrinsics.X86.Sse.StoreAligned(mem_addr, a.FP32);
-
-		/// <summary>
-		/// Store the lower single-precision (32-bit) floating-point element from "a" into memory. "mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVSS m32, xmm</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_store_ss(float* mem_addr, __m128 a) => System.Runtime.Intrinsics.X86.Sse.StoreScalar(mem_addr, a.FP32);
-
-		/// <summary>
-		/// Store the upper 2 single-precision (32-bit) floating-point elements from "a" into memory.
-		/// </summary>
-		/// <remarks><c>MOVHPS m64, xmm</c></remarks>
-		/// <param name="mem_addr"><c>__m64 {FP32}</c></param>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_storeh_pi(__m64* mem_addr, __m128 a) => System.Runtime.Intrinsics.X86.Sse.StoreHigh((float*)mem_addr, a.FP32);
-
-		/// <summary>
-		/// Store the lower 2 single-precision (32-bit) floating-point elements from "a" into memory.
-		/// </summary>
-		/// <remarks><c>MOVLPS m64, xmm</c></remarks>
-		/// <param name="mem_addr"><c>__m64 {FP32}</c></param>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_storel_pi(__m64* mem_addr, __m128 a) => System.Runtime.Intrinsics.X86.Sse.StoreLow((float*)mem_addr, a.FP32);
-
-		/// <summary>
-		/// Store 128-bits (composed of 4 packed single-precision (32-bit) floating-point elements) from "a" into memory.	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVUPS m128, xmm</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_storeu_ps(float* mem_addr, __m128 a) => System.Runtime.Intrinsics.X86.Sse.Store(mem_addr, a.FP32);
-
-		/// <summary>
-		/// Store 128-bits (composed of 4 packed single-precision (32-bit) floating-point elements) from "a" into memory using a non-temporal memory hint.	"mem_addr" must be aligned on a 16-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>MOVNTPS m128, xmm</c></remarks>
-		/// <param name="mem_addr"><c>float {FP32}</c></param>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_stream_ps(float* mem_addr, __m128 a) => System.Runtime.Intrinsics.X86.Sse.StoreAlignedNonTemporal(mem_addr, a.FP32);
-
-		/// <summary>
-		/// Subtract packed single-precision (32-bit) floating-point elements in "b" from packed single-precision (32-bit) floating-point elements in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>SUBPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_sub_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.Subtract(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Subtract the lower single-precision (32-bit) floating-point element in "b" from the lower single-precision (32-bit) floating-point element in "a", store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>SUBSS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_sub_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.SubtractScalar(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for equality, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomieq_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarUnorderedEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for greater-than-or-equal, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomige_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarUnorderedGreaterThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for greater-than, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomigt_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarUnorderedGreaterThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for less-than-or-equal, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomile_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarUnorderedLessThanOrEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for less-than, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomilt_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarUnorderedLessThan(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compare the lower single-precision (32-bit) floating-point element in "a" and "b" for not-equal, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomineq_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.CompareScalarUnorderedNotEqual(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Unpack and interleave single-precision (32-bit) floating-point elements from the high half "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>UNPCKHPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_unpackhi_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.UnpackHigh(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Unpack and interleave single-precision (32-bit) floating-point elements from the low half of "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>UNPCKLPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_unpacklo_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.UnpackLow(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Compute the bitwise XOR of packed single-precision (32-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>XORPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_xor_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse.Xor(a.FP32, b.FP32);
-
-	}
-}
diff --git a/src/External/RawIntrinsics/SSE2.ManuallyAdded.cs b/src/External/RawIntrinsics/SSE2.ManuallyAdded.cs
deleted file mode 100644
index de75d41..0000000
--- a/src/External/RawIntrinsics/SSE2.ManuallyAdded.cs
+++ /dev/null
@@ -1,17 +0,0 @@
-﻿namespace RawIntrinsics
-{
-	public static partial class SSE2
-	{
-		/// <summary>
-		/// Return vector of type __m128d with all elements set to zero.
-		/// </summary>
-		/// <returns><c>__m128d dst {M128}</c></returns>
-		public static __m128d _mm_setzero_pd() => System.Runtime.Intrinsics.Vector128<double>.Zero;
-		
-		/// <summary>
-		/// Return vector of type __m128i with all elements set to zero.
-		/// </summary>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_setzero_si128() => System.Runtime.Intrinsics.Vector128<byte>.Zero;
-	}
-}
\ No newline at end of file
diff --git a/src/External/RawIntrinsics/SSE2.cs b/src/External/RawIntrinsics/SSE2.cs
deleted file mode 100644
index e25c4fc..0000000
--- a/src/External/RawIntrinsics/SSE2.cs
+++ /dev/null
@@ -1,1714 +0,0 @@
-namespace RawIntrinsics
-{
-	public static unsafe partial class SSE2
-	{
-		/// <summary>
-		/// Add packed 16-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PADDW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_add_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Add(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Add packed 32-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PADDD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="b"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_add_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Add(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Add packed 64-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PADDQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="b"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_add_epi64(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Add(a.UI64, b.UI64);
-
-		/// <summary>
-		/// Add packed 8-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PADDB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_add_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Add(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Add packed double-precision (64-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>ADDPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_add_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.Add(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Add the lower double-precision (64-bit) floating-point element in "a" and "b", store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>ADDSD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_add_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.AddScalar(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Add packed signed 16-bit integers in "a" and "b" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PADDSW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_adds_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.AddSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Add packed signed 8-bit integers in "a" and "b" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PADDSB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <param name="b"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_adds_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.AddSaturate(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Add packed unsigned 16-bit integers in "a" and "b" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PADDUSW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_adds_epu16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.AddSaturate(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Add packed unsigned 8-bit integers in "a" and "b" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PADDUSB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_adds_epu8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.AddSaturate(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Compute the bitwise AND of packed double-precision (64-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>ANDPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_and_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.And(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise AND of 128 bits (representing integer data) in "a" and "b", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>PAND xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="b"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_and_si128(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.And(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Compute the bitwise NOT of packed double-precision (64-bit) floating-point elements in "a" and then AND with "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>ANDNPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_andnot_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.AndNot(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise NOT of 128 bits (representing integer data) in "a" and then AND with "b", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>PANDN xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="b"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_andnot_si128(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.AndNot(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Average packed unsigned 16-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PAVGW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_avg_epu16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Average(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Average packed unsigned 8-bit integers in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PAVGB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_avg_epu8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Average(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Shift "a" left by "imm8" bytes while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSLLDQ xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_bslli_si128(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShiftLeftLogical128BitLane(a.SI8, (byte)imm8);
-
-		/// <summary>
-		/// Shift "a" right by "imm8" bytes while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSRLDQ xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_bsrli_si128(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShiftRightLogical128BitLane(a.SI8, (byte)imm8);
-
-		/// <summary>
-		/// Compare packed 16-bit integers in "a" and "b" for equality, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PCMPEQW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_cmpeq_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.CompareEqual(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Compare packed 32-bit integers in "a" and "b" for equality, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PCMPEQD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="b"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_cmpeq_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.CompareEqual(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Compare packed 8-bit integers in "a" and "b" for equality, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PCMPEQB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_cmpeq_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.CompareEqual(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" for equality, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpeq_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" for equality, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpeq_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" for greater-than-or-equal, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpge_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareGreaterThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" for greater-than-or-equal, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpge_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarGreaterThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed signed 16-bit integers in "a" and "b" for greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PCMPGTW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_cmpgt_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.CompareGreaterThan(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Compare packed signed 32-bit integers in "a" and "b" for greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PCMPGTD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="b"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_cmpgt_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.CompareGreaterThan(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Compare packed signed 8-bit integers in "a" and "b" for greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PCMPGTB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <param name="b"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_cmpgt_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.CompareGreaterThan(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" for greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpgt_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareGreaterThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" for greater-than, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpgt_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarGreaterThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" for less-than-or-equal, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmple_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareLessThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" for less-than-or-equal, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmple_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarLessThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed signed 16-bit integers in "a" and "b" for less-than, and store the results in "dst". Note: This intrinsic emits the pcmpgtw instruction with the order of the operands switched.
-		/// </summary>
-		/// <remarks><c>PCMPGTW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_cmplt_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.CompareLessThan(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Compare packed signed 32-bit integers in "a" and "b" for less-than, and store the results in "dst". Note: This intrinsic emits the pcmpgtd instruction with the order of the operands switched.
-		/// </summary>
-		/// <remarks><c>PCMPGTD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="b"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_cmplt_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.CompareLessThan(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Compare packed signed 8-bit integers in "a" and "b" for less-than, and store the results in "dst". Note: This intrinsic emits the pcmpgtb instruction with the order of the operands switched.
-		/// </summary>
-		/// <remarks><c>PCMPGTB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <param name="b"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_cmplt_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.CompareLessThan(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" for less-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmplt_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareLessThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" for less-than, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmplt_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarLessThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" for not-equal, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpneq_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareNotEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" for not-equal, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpneq_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarNotEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" for not-greater-than-or-equal, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpnge_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareNotGreaterThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" for not-greater-than-or-equal, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpnge_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarNotGreaterThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" for not-greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpngt_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareNotGreaterThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" for not-greater-than, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpngt_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarNotGreaterThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" for not-less-than-or-equal, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpnle_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareNotLessThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" for not-less-than-or-equal, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpnle_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarNotLessThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" for not-less-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpnlt_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareNotLessThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" for not-less-than, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpnlt_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarNotLessThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" to see if neither is NaN, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpord_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareOrdered(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" to see if neither is NaN, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpord_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarOrdered(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b" to see if either is NaN, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CMPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpunord_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareUnordered(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b" to see if either is NaN, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CMPSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cmpunord_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarUnordered(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for equality, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comieq_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarOrderedEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for greater-than-or-equal, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comige_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarOrderedGreaterThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for greater-than, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comigt_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarOrderedGreaterThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for less-than-or-equal, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comile_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarOrderedLessThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for less-than, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comilt_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarOrderedLessThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for not-equal, and return the boolean result (0 or 1).
-		/// </summary>
-		/// <remarks><c>COMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_comineq_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarOrderedNotEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Convert packed signed 32-bit integers in "a" to packed double-precision (64-bit) floating-point elements, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CVTDQ2PD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cvtepi32_pd(__m128i a) => System.Runtime.Intrinsics.X86.Sse2.ConvertToVector128Double(a.SI32);
-
-		/// <summary>
-		/// Convert packed signed 32-bit integers in "a" to packed single-precision (32-bit) floating-point elements, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CVTDQ2PS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cvtepi32_ps(__m128i a) => System.Runtime.Intrinsics.X86.Sse2.ConvertToVector128Single(a.SI32);
-
-		/// <summary>
-		/// Convert packed double-precision (64-bit) floating-point elements in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CVTPD2DQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_cvtpd_epi32(__m128d a) => System.Runtime.Intrinsics.X86.Sse2.ConvertToVector128Int32(a.FP64);
-
-		/// <summary>
-		/// Convert packed double-precision (64-bit) floating-point elements in "a" to packed single-precision (32-bit) floating-point elements, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CVTPD2PS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cvtpd_ps(__m128d a) => System.Runtime.Intrinsics.X86.Sse2.ConvertToVector128Single(a.FP64);
-
-		/// <summary>
-		/// Convert packed single-precision (32-bit) floating-point elements in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CVTPS2DQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_cvtps_epi32(__m128 a) => System.Runtime.Intrinsics.X86.Sse2.ConvertToVector128Int32(a.FP32);
-
-		/// <summary>
-		/// Convert packed single-precision (32-bit) floating-point elements in "a" to packed double-precision (64-bit) floating-point elements, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CVTPS2PD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cvtps_pd(__m128 a) => System.Runtime.Intrinsics.X86.Sse2.ConvertToVector128Double(a.FP32);
-
-		/// <summary>
-		/// Convert the lower double-precision (64-bit) floating-point element in "a" to a 32-bit integer, and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>CVTSD2SI r32, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm_cvtsd_si32(__m128d a) => System.Runtime.Intrinsics.X86.Sse2.ConvertToInt32(a.FP64);
-
-		/// <summary>
-		/// Convert the lower double-precision (64-bit) floating-point element in "a" to a 64-bit integer, and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>CVTSD2SI r64, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>long dst {UI64}</c></returns>
-		public static long _mm_cvtsd_si64(__m128d a) => System.Runtime.Intrinsics.X86.Sse2.X64.ConvertToInt64(a.FP64);
-
-		/// <summary>
-		/// Convert the lower double-precision (64-bit) floating-point element in "b" to a single-precision (32-bit) floating-point element, store the result in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>CVTSD2SS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_cvtsd_ss(__m128 a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.ConvertScalarToVector128Single(a.FP32, b.FP64);
-
-		/// <summary>
-		/// Copy the lower 32-bit integer in "a" to "dst".
-		/// </summary>
-		/// <remarks><c>MOVD r32, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm_cvtsi128_si32(__m128i a) => (int)System.Runtime.Intrinsics.X86.Sse2.ConvertToUInt32(a.UI32);
-
-		/// <summary>
-		/// Copy the lower 64-bit integer in "a" to "dst".
-		/// </summary>
-		/// <remarks><c>MOVQ r64, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <returns><c>long dst {UI64}</c></returns>
-		public static long _mm_cvtsi128_si64(__m128i a) => (long)System.Runtime.Intrinsics.X86.Sse2.X64.ConvertToUInt64(a.UI64);
-
-		/// <summary>
-		/// Convert the signed 32-bit integer "b" to a double-precision (64-bit) floating-point element, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CVTSI2SD xmm, r32</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>int {SI32}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cvtsi32_sd(__m128d a, int b) => System.Runtime.Intrinsics.X86.Sse2.ConvertScalarToVector128Double(a.FP64, b);
-
-		/// <summary>
-		/// Copy 32-bit integer "a" to the lower elements of "dst", and zero the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>MOVD xmm, r32</c></remarks>
-		/// <param name="a"><c>int {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_cvtsi32_si128(int a) => System.Runtime.Intrinsics.X86.Sse2.ConvertScalarToVector128UInt32((uint)a);
-
-		/// <summary>
-		/// Convert the signed 64-bit integer "b" to a double-precision (64-bit) floating-point element, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CVTSI2SD xmm, r64</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>long {SI64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cvtsi64_sd(__m128d a, long b) => System.Runtime.Intrinsics.X86.Sse2.X64.ConvertScalarToVector128Double(a.FP64, b);
-
-		/// <summary>
-		/// Copy 64-bit integer "a" to the lower element of "dst", and zero the upper element.
-		/// </summary>
-		/// <remarks><c>MOVQ xmm, r64</c></remarks>
-		/// <param name="a"><c>long {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_cvtsi64_si128(long a) => System.Runtime.Intrinsics.X86.Sse2.X64.ConvertScalarToVector128UInt64((ulong)a);
-
-		/// <summary>
-		/// Convert the lower single-precision (32-bit) floating-point element in "b" to a double-precision (64-bit) floating-point element, store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>CVTSS2SD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_cvtss_sd(__m128d a, __m128 b) => System.Runtime.Intrinsics.X86.Sse2.ConvertScalarToVector128Double(a.FP64, b.FP32);
-
-		/// <summary>
-		/// Convert packed double-precision (64-bit) floating-point elements in "a" to packed 32-bit integers with truncation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CVTTPD2DQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_cvttpd_epi32(__m128d a) => System.Runtime.Intrinsics.X86.Sse2.ConvertToVector128Int32WithTruncation(a.FP64);
-
-		/// <summary>
-		/// Convert packed single-precision (32-bit) floating-point elements in "a" to packed 32-bit integers with truncation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>CVTTPS2DQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_cvttps_epi32(__m128 a) => System.Runtime.Intrinsics.X86.Sse2.ConvertToVector128Int32WithTruncation(a.FP32);
-
-		/// <summary>
-		/// Convert the lower double-precision (64-bit) floating-point element in "a" to a 32-bit integer with truncation, and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>CVTTSD2SI r32, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm_cvttsd_si32(__m128d a) => System.Runtime.Intrinsics.X86.Sse2.ConvertToInt32WithTruncation(a.FP64);
-
-		/// <summary>
-		/// Convert the lower double-precision (64-bit) floating-point element in "a" to a 64-bit integer with truncation, and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>CVTTSD2SI r64, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>long dst {UI64}</c></returns>
-		public static long _mm_cvttsd_si64(__m128d a) => System.Runtime.Intrinsics.X86.Sse2.X64.ConvertToInt64WithTruncation(a.FP64);
-
-		/// <summary>
-		/// Divide packed double-precision (64-bit) floating-point elements in "a" by packed elements in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>DIVPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_div_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.Divide(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Divide the lower double-precision (64-bit) floating-point element in "a" by the lower double-precision (64-bit) floating-point element in "b", store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>DIVSD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_div_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.DivideScalar(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Extract a 16-bit integer from "a", selected with "imm8", and store the result in the lower element of "dst".
-		/// </summary>
-		/// <remarks><c>PEXTRW r32, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>int dst {UI16}</c></returns>
-		public static int _mm_extract_epi16(__m128i a, int imm8) => (int)System.Runtime.Intrinsics.X86.Sse2.Extract(a.UI16, (byte)imm8);
-
-		/// <summary>
-		/// Copy "a" to "dst", and insert the 16-bit integer "i" into "dst" at the location specified by "imm8".
-		/// </summary>
-		/// <remarks><c>PINSRW xmm, r32, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="i"><c>int {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_insert_epi16(__m128i a, int i, int imm8) => System.Runtime.Intrinsics.X86.Sse2.Insert(a.UI16, (ushort)i, (byte)imm8);
-
-		/// <summary>
-		/// Perform a serializing operation on all load-from-memory instructions that were issued prior to this instruction. Guarantees that every load instruction that precedes, in program order, is globally visible before any load instruction which follows the fence in program order.
-		/// </summary>
-		/// <remarks><c>LFENCE </c></remarks>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_lfence() => System.Runtime.Intrinsics.X86.Sse2.LoadFence();
-
-		/// <summary>
-		/// Load 128-bits (composed of 2 packed double-precision (64-bit) floating-point elements) from memory into "dst".	"mem_addr" must be aligned on a 16-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>MOVAPD xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_load_pd(double* mem_addr) => System.Runtime.Intrinsics.X86.Sse2.LoadAlignedVector128(mem_addr);
-
-		/// <summary>
-		/// Load a double-precision (64-bit) floating-point element from memory into the lower of "dst", and zero the upper element. "mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVSD xmm, m64</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_load_sd(double* mem_addr) => System.Runtime.Intrinsics.X86.Sse2.LoadScalarVector128(mem_addr);
-
-		/// <summary>
-		/// Load 128-bits of integer data from memory into "dst". 	"mem_addr" must be aligned on a 16-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>MOVDQA xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_load_si128(__m128i* mem_addr) => System.Runtime.Intrinsics.X86.Sse2.LoadAlignedVector128((sbyte*)mem_addr);
-
-		/// <summary>
-		/// Load a double-precision (64-bit) floating-point element from memory into the upper element of "dst", and copy the lower element from "a" to "dst". "mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVHPD xmm, m64</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_loadh_pd(__m128d a, double* mem_addr) => System.Runtime.Intrinsics.X86.Sse2.LoadHigh(a.FP64, mem_addr);
-
-		/// <summary>
-		/// Load 64-bit integer from memory into the first element of "dst".
-		/// </summary>
-		/// <remarks><c>MOVQ xmm, m64</c></remarks>
-		/// <param name="mem_addr"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_loadl_epi64(__m128i* mem_addr) => System.Runtime.Intrinsics.X86.Sse2.LoadScalarVector128((long*)mem_addr);
-
-		/// <summary>
-		/// Load a double-precision (64-bit) floating-point element from memory into the lower element of "dst", and copy the upper element from "a" to "dst". "mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVLPD xmm, m64</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_loadl_pd(__m128d a, double* mem_addr) => System.Runtime.Intrinsics.X86.Sse2.LoadLow(a.FP64, mem_addr);
-
-		/// <summary>
-		/// Load 128-bits (composed of 2 packed double-precision (64-bit) floating-point elements) from memory into "dst".	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVUPD xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_loadu_pd(double* mem_addr) => System.Runtime.Intrinsics.X86.Sse2.LoadVector128(mem_addr);
-
-		/// <summary>
-		/// Load 128-bits of integer data from memory into "dst".	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVDQU xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_loadu_si128(__m128i* mem_addr) => System.Runtime.Intrinsics.X86.Sse2.LoadVector128((sbyte*)mem_addr);
-
-		/// <summary>
-		/// Load unaligned 32-bit integer from memory into the first element of "dst".
-		/// </summary>
-		/// <remarks><c>MOVD xmm, m32</c></remarks>
-		/// <param name="mem_addr"><c>void {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_loadu_si32(void* mem_addr) => System.Runtime.Intrinsics.X86.Sse2.LoadScalarVector128((int*)mem_addr);
-
-		/// <summary>
-		/// Multiply packed signed 16-bit integers in "a" and "b", producing intermediate signed 32-bit integers. Horizontally add adjacent pairs of intermediate 32-bit integers, and pack the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMADDWD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {SI32}</c></returns>
-		public static __m128i _mm_madd_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.MultiplyAddAdjacent(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Conditionally store 8-bit integer elements from "a" into memory using "mask" (elements are not stored when the highest bit is not set in the corresponding element) and a non-temporal memory hint. "mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MASKMOVDQU xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="mask"><c>__m128i {UI8}</c></param>
-		/// <param name="mem_addr"><c>byte {UI8}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_maskmoveu_si128(__m128i a, __m128i mask, byte* mem_addr) => System.Runtime.Intrinsics.X86.Sse2.MaskMove(a.UI8, mask.UI8, mem_addr);
-
-		/// <summary>
-		/// Compare packed signed 16-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMAXSW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_max_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Max(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Compare packed unsigned 8-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMAXUB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_max_epu8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Max(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>MAXPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_max_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.Max(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b", store the maximum value in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>MAXSD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_max_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.MaxScalar(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Perform a serializing operation on all load-from-memory and store-to-memory instructions that were issued prior to this instruction. Guarantees that every memory access that precedes, in program order, the memory fence instruction is globally visible before any memory instruction which follows the fence in program order.
-		/// </summary>
-		/// <remarks><c>MFENCE </c></remarks>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_mfence() => System.Runtime.Intrinsics.X86.Sse2.MemoryFence();
-
-		/// <summary>
-		/// Compare packed signed 16-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMINSW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_min_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Min(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Compare packed unsigned 8-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMINUB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_min_epu8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Min(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Compare packed double-precision (64-bit) floating-point elements in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>MINPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_min_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.Min(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point elements in "a" and "b", store the minimum value in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>MINSD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_min_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.MinScalar(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Copy the lower 64-bit integer in "a" to the lower element of "dst", and zero the upper element.
-		/// </summary>
-		/// <remarks><c>MOVQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_move_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Sse2.MoveScalar(a.UI64);
-
-		/// <summary>
-		/// Move the lower double-precision (64-bit) floating-point element from "b" to the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>MOVSD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_move_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.MoveScalar(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Create mask from the most significant bit of each 8-bit element in "a", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVMSKB r32, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <returns><c>int dst {MASK}</c></returns>
-		public static int _mm_movemask_epi8(__m128i a) => System.Runtime.Intrinsics.X86.Sse2.MoveMask(a.UI8);
-
-		/// <summary>
-		/// Set each bit of mask "dst" based on the most significant bit of the corresponding packed double-precision (64-bit) floating-point element in "a".
-		/// </summary>
-		/// <remarks><c>MOVMSKPD r32, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>int dst {MASK}</c></returns>
-		public static int _mm_movemask_pd(__m128d a) => System.Runtime.Intrinsics.X86.Sse2.MoveMask(a.FP64);
-
-		/// <summary>
-		/// Multiply the low unsigned 32-bit integers from each packed 64-bit element in "a" and "b", and store the unsigned 64-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>PMULUDQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="b"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_mul_epu32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Multiply(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Multiply packed double-precision (64-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>MULPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_mul_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.Multiply(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Multiply the lower double-precision (64-bit) floating-point element in "a" and "b", store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>MULSD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_mul_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.MultiplyScalar(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Multiply the packed signed 16-bit integers in "a" and "b", producing intermediate 32-bit integers, and store the high 16 bits of the intermediate integers in "dst".
-		/// </summary>
-		/// <remarks><c>PMULHW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_mulhi_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.MultiplyHigh(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Multiply the packed unsigned 16-bit integers in "a" and "b", producing intermediate 32-bit integers, and store the high 16 bits of the intermediate integers in "dst".
-		/// </summary>
-		/// <remarks><c>PMULHUW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_mulhi_epu16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.MultiplyHigh(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Multiply the packed 16-bit integers in "a" and "b", producing intermediate 32-bit integers, and store the low 16 bits of the intermediate integers in "dst".
-		/// </summary>
-		/// <remarks><c>PMULLW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_mullo_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.MultiplyLow(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Compute the bitwise OR of packed double-precision (64-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>ORPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_or_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.Or(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise OR of 128 bits (representing integer data) in "a" and "b", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>POR xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="b"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_or_si128(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Or(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Convert packed signed 16-bit integers from "a" and "b" to packed 8-bit integers using signed saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PACKSSWB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {SI8}</c></returns>
-		public static __m128i _mm_packs_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.PackSignedSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Convert packed signed 32-bit integers from "a" and "b" to packed 16-bit integers using signed saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PACKSSDW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="b"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {SI16}</c></returns>
-		public static __m128i _mm_packs_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.PackSignedSaturate(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Convert packed signed 16-bit integers from "a" and "b" to packed 8-bit integers using unsigned saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PACKUSWB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_packus_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.PackUnsignedSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Compute the absolute differences of packed unsigned 8-bit integers in "a" and "b", then horizontally sum each consecutive 8 differences to produce two unsigned 16-bit integers, and pack these unsigned 16-bit integers in the low 16 bits of 64-bit elements in "dst".
-		/// </summary>
-		/// <remarks><c>PSADBW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_sad_epu8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.SumAbsoluteDifferences(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Broadcast 16-bit integer "a" to all all elements of "dst". This intrinsic may generate "vpbroadcastw".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>short {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_set1_epi16(short a) => System.Runtime.Intrinsics.Vector128.Create((ushort)a);
-
-		/// <summary>
-		/// Broadcast 32-bit integer "a" to all elements of "dst". This intrinsic may generate "vpbroadcastd".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>int {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_set1_epi32(int a) => System.Runtime.Intrinsics.Vector128.Create((uint)a);
-
-		/// <summary>
-		/// Broadcast 64-bit integer "a" to all elements of "dst". This intrinsic may generate the "vpbroadcastq".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>long {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_set1_epi64x(long a) => System.Runtime.Intrinsics.Vector128.Create((ulong)a);
-
-		/// <summary>
-		/// Broadcast 8-bit integer "a" to all elements of "dst". This intrinsic may generate "vpbroadcastb".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>byte {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_set1_epi8(byte a) => System.Runtime.Intrinsics.Vector128.Create(a);
-
-		/// <summary>
-		/// Broadcast double-precision (64-bit) floating-point value "a" to all elements of "dst".
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="a"><c>double {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_set1_pd(double a) => System.Runtime.Intrinsics.Vector128.Create(a);
-
-		/// <summary>
-		/// Set packed 16-bit integers in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e7"><c>short {UI16}</c></param>
-		/// <param name="e6"><c>short {UI16}</c></param>
-		/// <param name="e5"><c>short {UI16}</c></param>
-		/// <param name="e4"><c>short {UI16}</c></param>
-		/// <param name="e3"><c>short {UI16}</c></param>
-		/// <param name="e2"><c>short {UI16}</c></param>
-		/// <param name="e1"><c>short {UI16}</c></param>
-		/// <param name="e0"><c>short {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_setr_epi16(short e7, short e6, short e5, short e4, short e3, short e2, short e1, short e0) => System.Runtime.Intrinsics.Vector128.Create((ushort)e7, (ushort)e6, (ushort)e5, (ushort)e4, (ushort)e3, (ushort)e2, (ushort)e1, (ushort)e0);
-
-		/// <summary>
-		/// Set packed 32-bit integers in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e3"><c>int {UI32}</c></param>
-		/// <param name="e2"><c>int {UI32}</c></param>
-		/// <param name="e1"><c>int {UI32}</c></param>
-		/// <param name="e0"><c>int {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_setr_epi32(int e3, int e2, int e1, int e0) => System.Runtime.Intrinsics.Vector128.Create((uint)e3, (uint)e2, (uint)e1, (uint)e0);
-
-		/// <summary>
-		/// Set packed 64-bit integers in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e1"><c>__m64 {UI64}</c></param>
-		/// <param name="e0"><c>__m64 {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_setr_epi64(__m64 e1, __m64 e0) => System.Runtime.Intrinsics.Vector128.Create(e1.SI32, e0.SI32);
-
-		/// <summary>
-		/// Set packed 8-bit integers in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e15"><c>byte {UI8}</c></param>
-		/// <param name="e14"><c>byte {UI8}</c></param>
-		/// <param name="e13"><c>byte {UI8}</c></param>
-		/// <param name="e12"><c>byte {UI8}</c></param>
-		/// <param name="e11"><c>byte {UI8}</c></param>
-		/// <param name="e10"><c>byte {UI8}</c></param>
-		/// <param name="e9"><c>byte {UI8}</c></param>
-		/// <param name="e8"><c>byte {UI8}</c></param>
-		/// <param name="e7"><c>byte {UI8}</c></param>
-		/// <param name="e6"><c>byte {UI8}</c></param>
-		/// <param name="e5"><c>byte {UI8}</c></param>
-		/// <param name="e4"><c>byte {UI8}</c></param>
-		/// <param name="e3"><c>byte {UI8}</c></param>
-		/// <param name="e2"><c>byte {UI8}</c></param>
-		/// <param name="e1"><c>byte {UI8}</c></param>
-		/// <param name="e0"><c>byte {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_setr_epi8(byte e15, byte e14, byte e13, byte e12, byte e11, byte e10, byte e9, byte e8, byte e7, byte e6, byte e5, byte e4, byte e3, byte e2, byte e1, byte e0) => System.Runtime.Intrinsics.Vector128.Create(e15, e14, e13, e12, e11, e10, e9, e8, e7, e6, e5, e4, e3, e2, e1, e0);
-
-		/// <summary>
-		/// Set packed double-precision (64-bit) floating-point elements in "dst" with the supplied values in reverse order.
-		/// </summary>
-		/// <remarks><c></c></remarks>
-		/// <param name="e1"><c>double {FP64}</c></param>
-		/// <param name="e0"><c>double {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_setr_pd(double e1, double e0) => System.Runtime.Intrinsics.Vector128.Create(e1, e0);
-
-		/// <summary>
-		/// Shuffle 32-bit integers in "a" using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSHUFD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_shuffle_epi32(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.Shuffle(a.UI32, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle double-precision (64-bit) floating-point elements using the control in "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>SHUFPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_shuffle_pd(__m128d a, __m128d b, int imm8) => System.Runtime.Intrinsics.X86.Sse2.Shuffle(a.FP64, b.FP64, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle 16-bit integers in the high 64 bits of "a" using the control in "imm8". Store the results in the high 64 bits of "dst", with the low 64 bits being copied from from "a" to "dst".
-		/// </summary>
-		/// <remarks><c>PSHUFHW xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_shufflehi_epi16(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShuffleHigh(a.UI16, (byte)imm8);
-
-		/// <summary>
-		/// Shuffle 16-bit integers in the low 64 bits of "a" using the control in "imm8". Store the results in the low 64 bits of "dst", with the high 64 bits being copied from from "a" to "dst".
-		/// </summary>
-		/// <remarks><c>PSHUFLW xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_shufflelo_epi16(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShuffleLow(a.UI16, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 16-bit integers in "a" left by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSLLW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="count"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_sll_epi16(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Sse2.ShiftLeftLogical(a.UI16, count.UI16);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" left by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSLLD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="count"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_sll_epi32(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Sse2.ShiftLeftLogical(a.UI32, count.UI32);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" left by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSLLQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="count"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_sll_epi64(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Sse2.ShiftLeftLogical(a.UI64, count.UI64);
-
-		/// <summary>
-		/// Shift packed 16-bit integers in "a" left by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSLLW xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_slli_epi16(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShiftLeftLogical(a.UI16, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" left by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSLLD xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_slli_epi32(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShiftLeftLogical(a.UI32, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" left by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSLLQ xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_slli_epi64(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShiftLeftLogical(a.UI64, (byte)imm8);
-
-		/// <summary>
-		/// Compute the square root of packed double-precision (64-bit) floating-point elements in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>SQRTPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_sqrt_pd(__m128d a) => System.Runtime.Intrinsics.X86.Sse2.Sqrt(a.FP64);
-
-		/// <summary>
-		/// Compute the square root of the lower double-precision (64-bit) floating-point element in "b", store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>SQRTSD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_sqrt_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.SqrtScalar(a.FP64);
-
-		/// <summary>
-		/// Shift packed 16-bit integers in "a" right by "count" while shifting in sign bits, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSRAW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="count"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_sra_epi16(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Sse2.ShiftRightArithmetic(a.SI16, count.SI16);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" right by "count" while shifting in sign bits, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSRAD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="count"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_sra_epi32(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Sse2.ShiftRightArithmetic(a.SI32, count.SI32);
-
-		/// <summary>
-		/// Shift packed 16-bit integers in "a" right by "imm8" while shifting in sign bits, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSRAW xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_srai_epi16(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShiftRightArithmetic(a.SI16, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" right by "imm8" while shifting in sign bits, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSRAD xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_srai_epi32(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShiftRightArithmetic(a.SI32, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 16-bit integers in "a" right by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSRLW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="count"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_srl_epi16(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Sse2.ShiftRightLogical(a.UI16, count.UI16);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" right by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSRLD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="count"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_srl_epi32(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Sse2.ShiftRightLogical(a.UI32, count.UI32);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" right by "count" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSRLQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="count"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_srl_epi64(__m128i a, __m128i count) => System.Runtime.Intrinsics.X86.Sse2.ShiftRightLogical(a.UI64, count.UI64);
-
-		/// <summary>
-		/// Shift packed 16-bit integers in "a" right by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSRLW xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_srli_epi16(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShiftRightLogical(a.UI16, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 32-bit integers in "a" right by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSRLD xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_srli_epi32(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShiftRightLogical(a.UI32, (byte)imm8);
-
-		/// <summary>
-		/// Shift packed 64-bit integers in "a" right by "imm8" while shifting in zeros, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSRLQ xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_srli_epi64(__m128i a, int imm8) => System.Runtime.Intrinsics.X86.Sse2.ShiftRightLogical(a.UI64, (byte)imm8);
-
-		/// <summary>
-		/// Store 128-bits (composed of 2 packed double-precision (64-bit) floating-point elements) from "a" into memory.	"mem_addr" must be aligned on a 16-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>MOVAPD m128, xmm</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_store_pd(double* mem_addr, __m128d a) => System.Runtime.Intrinsics.X86.Sse2.StoreAligned(mem_addr, a.FP64);
-
-		/// <summary>
-		/// Store the lower double-precision (64-bit) floating-point element from "a" into memory. "mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVSD m64, xmm</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_store_sd(double* mem_addr, __m128d a) => System.Runtime.Intrinsics.X86.Sse2.StoreScalar(mem_addr, a.FP64);
-
-		/// <summary>
-		/// Store 128-bits of integer data from "a" into memory. 	"mem_addr" must be aligned on a 16-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>MOVDQA m128, xmm</c></remarks>
-		/// <param name="mem_addr"><c>__m128i {M128}</c></param>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_store_si128(__m128i* mem_addr, __m128i a) => System.Runtime.Intrinsics.X86.Sse2.StoreAligned((sbyte*)mem_addr, a.SI8);
-
-		/// <summary>
-		/// Store the upper double-precision (64-bit) floating-point element from "a" into memory.
-		/// </summary>
-		/// <remarks><c>MOVHPD m64, xmm</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_storeh_pd(double* mem_addr, __m128d a) => System.Runtime.Intrinsics.X86.Sse2.StoreHigh(mem_addr, a.FP64);
-
-		/// <summary>
-		/// Store 64-bit integer from the first element of "a" into memory.
-		/// </summary>
-		/// <remarks><c>MOVQ m64, xmm</c></remarks>
-		/// <param name="mem_addr"><c>__m128i {UI64}</c></param>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_storel_epi64(__m128i* mem_addr, __m128i a) => System.Runtime.Intrinsics.X86.Sse2.StoreScalar((long*)mem_addr, a.SI64);
-
-		/// <summary>
-		/// Store the lower double-precision (64-bit) floating-point element from "a" into memory.
-		/// </summary>
-		/// <remarks><c>MOVLPD m64, xmm</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_storel_pd(double* mem_addr, __m128d a) => System.Runtime.Intrinsics.X86.Sse2.StoreLow(mem_addr, a.FP64);
-
-		/// <summary>
-		/// Store 128-bits (composed of 2 packed double-precision (64-bit) floating-point elements) from "a" into memory.	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVUPD m128, xmm</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_storeu_pd(double* mem_addr, __m128d a) => System.Runtime.Intrinsics.X86.Sse2.Store(mem_addr, a.FP64);
-
-		/// <summary>
-		/// Store 128-bits of integer data from "a" into memory.	"mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVDQU m128, xmm</c></remarks>
-		/// <param name="mem_addr"><c>__m128i {M128}</c></param>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_storeu_si128(__m128i* mem_addr, __m128i a) => System.Runtime.Intrinsics.X86.Sse2.Store((sbyte*)mem_addr, a.SI8);
-
-		/// <summary>
-		/// Store 32-bit integer from the first element of "a" into memory. "mem_addr" does not need to be aligned on any particular boundary.
-		/// </summary>
-		/// <remarks><c>MOVD m32, xmm</c></remarks>
-		/// <param name="mem_addr"><c>void {UI32}</c></param>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_storeu_si32(void* mem_addr, __m128i a) => System.Runtime.Intrinsics.X86.Sse2.StoreScalar((int*)mem_addr, a.SI32);
-
-		/// <summary>
-		/// Store 128-bits (composed of 2 packed double-precision (64-bit) floating-point elements) from "a" into memory using a non-temporal memory hint.	"mem_addr" must be aligned on a 16-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>MOVNTPD m128, xmm</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_stream_pd(double* mem_addr, __m128d a) => System.Runtime.Intrinsics.X86.Sse2.StoreAlignedNonTemporal(mem_addr, a.FP64);
-
-		/// <summary>
-		/// Store 128-bits of integer data from "a" into memory using a non-temporal memory hint. 	"mem_addr" must be aligned on a 16-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>MOVNTDQ m128, xmm</c></remarks>
-		/// <param name="mem_addr"><c>__m128i {M128}</c></param>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_stream_si128(__m128i* mem_addr, __m128i a) => System.Runtime.Intrinsics.X86.Sse2.StoreAlignedNonTemporal((sbyte*)mem_addr, a.SI8);
-
-		/// <summary>
-		/// Store 32-bit integer "a" into memory using a non-temporal hint to minimize cache pollution. If the cache line containing address "mem_addr" is already in the cache, the cache will be updated.
-		/// </summary>
-		/// <remarks><c>MOVNTI m32, r32</c></remarks>
-		/// <param name="mem_addr"><c>int {UI32}</c></param>
-		/// <param name="a"><c>int {UI32}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_stream_si32(int* mem_addr, int a) => System.Runtime.Intrinsics.X86.Sse2.StoreNonTemporal((uint*)mem_addr, (uint)a);
-
-		/// <summary>
-		/// Store 64-bit integer "a" into memory using a non-temporal hint to minimize cache pollution. If the cache line containing address "mem_addr" is already in the cache, the cache will be updated.
-		/// </summary>
-		/// <remarks><c>MOVNTI m64, r64</c></remarks>
-		/// <param name="mem_addr"><c>long {UI64}</c></param>
-		/// <param name="a"><c>long {UI64}</c></param>
-		/// <returns><c>void  {}</c></returns>
-		public static void _mm_stream_si64(long* mem_addr, long a) => System.Runtime.Intrinsics.X86.Sse2.X64.StoreNonTemporal((ulong*)mem_addr, (ulong)a);
-
-		/// <summary>
-		/// Subtract packed 16-bit integers in "b" from packed 16-bit integers in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSUBW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_sub_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Subtract(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Subtract packed 32-bit integers in "b" from packed 32-bit integers in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSUBD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="b"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_sub_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Subtract(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Subtract packed 64-bit integers in "b" from packed 64-bit integers in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSUBQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="b"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_sub_epi64(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Subtract(a.UI64, b.UI64);
-
-		/// <summary>
-		/// Subtract packed 8-bit integers in "b" from packed 8-bit integers in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSUBB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_sub_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Subtract(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Subtract packed double-precision (64-bit) floating-point elements in "b" from packed double-precision (64-bit) floating-point elements in "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>SUBPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_sub_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.Subtract(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Subtract the lower double-precision (64-bit) floating-point element in "b" from the lower double-precision (64-bit) floating-point element in "a", store the result in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>SUBSD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_sub_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.SubtractScalar(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Subtract packed signed 16-bit integers in "b" from packed 16-bit integers in "a" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSUBSW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_subs_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.SubtractSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Subtract packed signed 8-bit integers in "b" from packed 8-bit integers in "a" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSUBSB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <param name="b"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_subs_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.SubtractSaturate(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Subtract packed unsigned 16-bit integers in "b" from packed unsigned 16-bit integers in "a" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSUBUSW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_subs_epu16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.SubtractSaturate(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Subtract packed unsigned 8-bit integers in "b" from packed unsigned 8-bit integers in "a" using saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSUBUSB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_subs_epu8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.SubtractSaturate(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for equality, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomieq_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarUnorderedEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for greater-than-or-equal, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomige_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarUnorderedGreaterThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for greater-than, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomigt_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarUnorderedGreaterThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for less-than-or-equal, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomile_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarUnorderedLessThanOrEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for less-than, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomilt_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarUnorderedLessThan(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compare the lower double-precision (64-bit) floating-point element in "a" and "b" for not-equal, and return the boolean result (0 or 1). This instruction will not signal an exception for QNaNs.
-		/// </summary>
-		/// <remarks><c>UCOMISD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_ucomineq_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.CompareScalarUnorderedNotEqual(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Unpack and interleave 16-bit integers from the high half of "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PUNPCKHWD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_unpackhi_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.UnpackHigh(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Unpack and interleave 32-bit integers from the high half of "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PUNPCKHDQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="b"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_unpackhi_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.UnpackHigh(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Unpack and interleave 64-bit integers from the high half of "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PUNPCKHQDQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="b"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_unpackhi_epi64(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.UnpackHigh(a.UI64, b.UI64);
-
-		/// <summary>
-		/// Unpack and interleave 8-bit integers from the high half of "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PUNPCKHBW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_unpackhi_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.UnpackHigh(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Unpack and interleave double-precision (64-bit) floating-point elements from the high half of "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>UNPCKHPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_unpackhi_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.UnpackHigh(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Unpack and interleave 16-bit integers from the low half of "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PUNPCKLWD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_unpacklo_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.UnpackLow(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Unpack and interleave 32-bit integers from the low half of "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PUNPCKLDQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="b"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_unpacklo_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.UnpackLow(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Unpack and interleave 64-bit integers from the low half of "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PUNPCKLQDQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="b"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_unpacklo_epi64(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.UnpackLow(a.UI64, b.UI64);
-
-		/// <summary>
-		/// Unpack and interleave 8-bit integers from the low half of "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PUNPCKLBW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_unpacklo_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.UnpackLow(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Unpack and interleave double-precision (64-bit) floating-point elements from the low half of "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>UNPCKLPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_unpacklo_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.UnpackLow(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise XOR of packed double-precision (64-bit) floating-point elements in "a" and "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>XORPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_xor_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse2.Xor(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Compute the bitwise XOR of 128 bits (representing integer data) in "a" and "b", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>PXOR xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="b"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_xor_si128(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse2.Xor(a.UI8, b.UI8);
-
-	}
-}
diff --git a/src/External/RawIntrinsics/SSE3.cs b/src/External/RawIntrinsics/SSE3.cs
deleted file mode 100644
index de71b53..0000000
--- a/src/External/RawIntrinsics/SSE3.cs
+++ /dev/null
@@ -1,100 +0,0 @@
-namespace RawIntrinsics
-{
-	public static unsafe partial class SSE3
-	{
-		/// <summary>
-		/// Alternatively add and subtract packed double-precision (64-bit) floating-point elements in "a" to/from packed elements in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>ADDSUBPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_addsub_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse3.AddSubtract(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Alternatively add and subtract packed single-precision (32-bit) floating-point elements in "a" to/from packed elements in "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>ADDSUBPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_addsub_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse3.AddSubtract(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of double-precision (64-bit) floating-point elements in "a" and "b", and pack the results in "dst".
-		/// </summary>
-		/// <remarks><c>HADDPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_hadd_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse3.HorizontalAdd(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of single-precision (32-bit) floating-point elements in "a" and "b", and pack the results in "dst".
-		/// </summary>
-		/// <remarks><c>HADDPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_hadd_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse3.HorizontalAdd(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Horizontally subtract adjacent pairs of double-precision (64-bit) floating-point elements in "a" and "b", and pack the results in "dst".
-		/// </summary>
-		/// <remarks><c>HSUBPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_hsub_pd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse3.HorizontalSubtract(a.FP64, b.FP64);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of single-precision (32-bit) floating-point elements in "a" and "b", and pack the results in "dst".
-		/// </summary>
-		/// <remarks><c>HSUBPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_hsub_ps(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse3.HorizontalSubtract(a.FP32, b.FP32);
-
-		/// <summary>
-		/// Load 128-bits of integer data from unaligned memory into "dst". This intrinsic may perform better than "_mm_loadu_si128" when the data crosses a cache line boundary.
-		/// </summary>
-		/// <remarks><c>LDDQU xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_lddqu_si128(__m128i* mem_addr) => System.Runtime.Intrinsics.X86.Sse3.LoadDquVector128((sbyte*)mem_addr);
-
-		/// <summary>
-		/// Load a double-precision (64-bit) floating-point element from memory into both elements of "dst".
-		/// </summary>
-		/// <remarks><c>MOVDDUP xmm, m64</c></remarks>
-		/// <param name="mem_addr"><c>double {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_loaddup_pd(double* mem_addr) => System.Runtime.Intrinsics.X86.Sse3.LoadAndDuplicateToVector128(mem_addr);
-
-		/// <summary>
-		/// Duplicate the low double-precision (64-bit) floating-point element from "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>MOVDDUP xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_movedup_pd(__m128d a) => System.Runtime.Intrinsics.X86.Sse3.MoveAndDuplicate(a.FP64);
-
-		/// <summary>
-		/// Duplicate odd-indexed single-precision (32-bit) floating-point elements from "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>MOVSHDUP xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_movehdup_ps(__m128 a) => System.Runtime.Intrinsics.X86.Sse3.MoveHighAndDuplicate(a.FP32);
-
-		/// <summary>
-		/// Duplicate even-indexed single-precision (32-bit) floating-point elements from "a", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>MOVSLDUP xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_moveldup_ps(__m128 a) => System.Runtime.Intrinsics.X86.Sse3.MoveLowAndDuplicate(a.FP32);
-
-	}
-}
diff --git a/src/External/RawIntrinsics/SSE41.cs b/src/External/RawIntrinsics/SSE41.cs
deleted file mode 100644
index 105b0a8..0000000
--- a/src/External/RawIntrinsics/SSE41.cs
+++ /dev/null
@@ -1,525 +0,0 @@
-namespace RawIntrinsics
-{
-	public static unsafe partial class SSE41
-	{
-		/// <summary>
-		/// Blend packed 16-bit integers from "a" and "b" using control mask "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PBLENDW xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_blend_epi16(__m128i a, __m128i b, int imm8) => System.Runtime.Intrinsics.X86.Sse41.Blend(a.UI16, b.UI16, (byte)imm8);
-
-		/// <summary>
-		/// Blend packed double-precision (64-bit) floating-point elements from "a" and "b" using control mask "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>BLENDPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_blend_pd(__m128d a, __m128d b, int imm8) => System.Runtime.Intrinsics.X86.Sse41.Blend(a.FP64, b.FP64, (byte)imm8);
-
-		/// <summary>
-		/// Blend packed single-precision (32-bit) floating-point elements from "a" and "b" using control mask "imm8", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>BLENDPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_blend_ps(__m128 a, __m128 b, int imm8) => System.Runtime.Intrinsics.X86.Sse41.Blend(a.FP32, b.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Blend packed 8-bit integers from "a" and "b" using "mask", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PBLENDVB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <param name="mask"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_blendv_epi8(__m128i a, __m128i b, __m128i mask) => System.Runtime.Intrinsics.X86.Sse41.BlendVariable(a.UI8, b.UI8, mask.UI8);
-
-		/// <summary>
-		/// Blend packed double-precision (64-bit) floating-point elements from "a" and "b" using "mask", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>BLENDVPD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="mask"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_blendv_pd(__m128d a, __m128d b, __m128d mask) => System.Runtime.Intrinsics.X86.Sse41.BlendVariable(a.FP64, b.FP64, mask.FP64);
-
-		/// <summary>
-		/// Blend packed single-precision (32-bit) floating-point elements from "a" and "b" using "mask", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>BLENDVPS xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="mask"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_blendv_ps(__m128 a, __m128 b, __m128 mask) => System.Runtime.Intrinsics.X86.Sse41.BlendVariable(a.FP32, b.FP32, mask.FP32);
-
-		/// <summary>
-		/// Round the packed double-precision (64-bit) floating-point elements in "a" up to an integer value, and store the results as packed double-precision floating-point elements in "dst".
-		/// </summary>
-		/// <remarks><c>ROUNDPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_ceil_pd(__m128d a) => System.Runtime.Intrinsics.X86.Sse41.Ceiling(a.FP64);
-
-		/// <summary>
-		/// Round the packed single-precision (32-bit) floating-point elements in "a" up to an integer value, and store the results as packed single-precision floating-point elements in "dst".
-		/// </summary>
-		/// <remarks><c>ROUNDPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_ceil_ps(__m128 a) => System.Runtime.Intrinsics.X86.Sse41.Ceiling(a.FP32);
-
-		/// <summary>
-		/// Round the lower double-precision (64-bit) floating-point element in "b" up to an integer value, store the result as a double-precision floating-point element in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>ROUNDSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_ceil_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse41.CeilingScalar(a.FP64);
-
-		/// <summary>
-		/// Round the lower single-precision (32-bit) floating-point element in "b" up to an integer value, store the result as a single-precision floating-point element in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>ROUNDSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_ceil_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse41.CeilingScalar(a.FP32);
-
-		/// <summary>
-		/// Compare packed 64-bit integers in "a" and "b" for equality, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PCMPEQQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="b"><c>__m128i {UI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_cmpeq_epi64(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.CompareEqual(a.UI64, b.UI64);
-
-		/// <summary>
-		/// Sign extend packed 16-bit integers in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVSXWD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {SI32}</c></returns>
-		public static __m128i _mm_cvtepi16_epi32(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int32(a.SI16);
-
-		/// <summary>
-		/// Sign extend packed 16-bit integers in "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVSXWQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {SI64}</c></returns>
-		public static __m128i _mm_cvtepi16_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int64(a.SI16);
-
-		/// <summary>
-		/// Sign extend packed 32-bit integers in "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVSXDQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {SI64}</c></returns>
-		public static __m128i _mm_cvtepi32_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int64(a.SI32);
-
-		/// <summary>
-		/// Sign extend packed 8-bit integers in "a" to packed 16-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVSXBW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {SI16}</c></returns>
-		public static __m128i _mm_cvtepi8_epi16(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int16(a.SI8);
-
-		/// <summary>
-		/// Sign extend packed 8-bit integers in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVSXBD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {SI32}</c></returns>
-		public static __m128i _mm_cvtepi8_epi32(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int32(a.SI8);
-
-		/// <summary>
-		/// Sign extend packed 8-bit integers in the low 8 bytes of "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVSXBQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {SI64}</c></returns>
-		public static __m128i _mm_cvtepi8_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int64(a.SI8);
-
-		/// <summary>
-		/// Zero extend packed unsigned 16-bit integers in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVZXWD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_cvtepu16_epi32(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int32(a.UI16);
-
-		/// <summary>
-		/// Zero extend packed unsigned 16-bit integers in "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVZXWQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_cvtepu16_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int64(a.UI16);
-
-		/// <summary>
-		/// Zero extend packed unsigned 32-bit integers in "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVZXDQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_cvtepu32_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int64(a.UI32);
-
-		/// <summary>
-		/// Zero extend packed unsigned 8-bit integers in "a" to packed 16-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVZXBW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_cvtepu8_epi16(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int16(a.UI8);
-
-		/// <summary>
-		/// Zero extend packed unsigned 8-bit integers in "a" to packed 32-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVZXBD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_cvtepu8_epi32(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int32(a.UI8);
-
-		/// <summary>
-		/// Zero extend packed unsigned 8-bit integers in the low 8 byte sof "a" to packed 64-bit integers, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PMOVZXBQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_cvtepu8_epi64(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.ConvertToVector128Int64(a.UI8);
-
-		/// <summary>
-		/// Conditionally multiply the packed double-precision (64-bit) floating-point elements in "a" and "b" using the high 4 bits in "imm8", sum the four products, and conditionally store the sum in "dst" using the low 4 bits of "imm8".
-		/// </summary>
-		/// <remarks><c>DPPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_dp_pd(__m128d a, __m128d b, int imm8) => System.Runtime.Intrinsics.X86.Sse41.DotProduct(a.FP64, b.FP64, (byte)imm8);
-
-		/// <summary>
-		/// Conditionally multiply the packed single-precision (32-bit) floating-point elements in "a" and "b" using the high 4 bits in "imm8", sum the four products, and conditionally store the sum in "dst" using the low 4 bits of "imm8".
-		/// </summary>
-		/// <remarks><c>DPPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_dp_ps(__m128 a, __m128 b, int imm8) => System.Runtime.Intrinsics.X86.Sse41.DotProduct(a.FP32, b.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Extract a 32-bit integer from "a", selected with "imm8", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>PEXTRD r32, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm_extract_epi32(__m128i a, int imm8) => (int)System.Runtime.Intrinsics.X86.Sse41.Extract(a.UI32, (byte)imm8);
-
-		/// <summary>
-		/// Extract a 64-bit integer from "a", selected with "imm8", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>PEXTRQ r64, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>long dst {UI64}</c></returns>
-		public static long _mm_extract_epi64(__m128i a, int imm8) => (long)System.Runtime.Intrinsics.X86.Sse41.X64.Extract(a.UI64, (byte)imm8);
-
-		/// <summary>
-		/// Extract an 8-bit integer from "a", selected with "imm8", and store the result in the lower element of "dst".
-		/// </summary>
-		/// <remarks><c>PEXTRB r32, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>int dst {UI8}</c></returns>
-		public static int _mm_extract_epi8(__m128i a, int imm8) => (int)System.Runtime.Intrinsics.X86.Sse41.Extract(a.UI8, (byte)imm8);
-
-		/// <summary>
-		/// Extract a single-precision (32-bit) floating-point element from "a", selected with "imm8", and store the result in "dst".
-		/// </summary>
-		/// <remarks><c>EXTRACTPS r32, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>int dst {UI32}</c></returns>
-		public static int _mm_extract_ps(__m128 a, int imm8) => (int)System.Runtime.Intrinsics.X86.Sse41.Extract(a.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Round the packed double-precision (64-bit) floating-point elements in "a" down to an integer value, and store the results as packed double-precision floating-point elements in "dst".
-		/// </summary>
-		/// <remarks><c>ROUNDPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_floor_pd(__m128d a) => System.Runtime.Intrinsics.X86.Sse41.Floor(a.FP64);
-
-		/// <summary>
-		/// Round the packed single-precision (32-bit) floating-point elements in "a" down to an integer value, and store the results as packed single-precision floating-point elements in "dst".
-		/// </summary>
-		/// <remarks><c>ROUNDPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_floor_ps(__m128 a) => System.Runtime.Intrinsics.X86.Sse41.Floor(a.FP32);
-
-		/// <summary>
-		/// Round the lower double-precision (64-bit) floating-point element in "b" down to an integer value, store the result as a double-precision floating-point element in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".
-		/// </summary>
-		/// <remarks><c>ROUNDSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_floor_sd(__m128d a, __m128d b) => System.Runtime.Intrinsics.X86.Sse41.FloorScalar(a.FP64);
-
-		/// <summary>
-		/// Round the lower single-precision (32-bit) floating-point element in "b" down to an integer value, store the result as a single-precision floating-point element in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".
-		/// </summary>
-		/// <remarks><c>ROUNDSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_floor_ss(__m128 a, __m128 b) => System.Runtime.Intrinsics.X86.Sse41.FloorScalar(a.FP32);
-
-		/// <summary>
-		/// Copy "a" to "dst", and insert the 32-bit integer "i" into "dst" at the location specified by "imm8".
-		/// </summary>
-		/// <remarks><c>PINSRD xmm, r32, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="i"><c>int {UI32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_insert_epi32(__m128i a, int i, int imm8) => System.Runtime.Intrinsics.X86.Sse41.Insert(a.UI32, (uint)i, (byte)imm8);
-
-		/// <summary>
-		/// Copy "a" to "dst", and insert the 64-bit integer "i" into "dst" at the location specified by "imm8".
-		/// </summary>
-		/// <remarks><c>PINSRQ xmm, r64, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI64}</c></param>
-		/// <param name="i"><c>long {UI64}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_insert_epi64(__m128i a, long i, int imm8) => System.Runtime.Intrinsics.X86.Sse41.X64.Insert(a.UI64, (ulong)i, (byte)imm8);
-
-		/// <summary>
-		/// Copy "a" to "dst", and insert the lower 8-bit integer from "i" into "dst" at the location specified by "imm8".
-		/// </summary>
-		/// <remarks><c>PINSRB xmm, r32, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="i"><c>int {UI8}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_insert_epi8(__m128i a, int i, int imm8) => System.Runtime.Intrinsics.X86.Sse41.Insert(a.UI8, (byte)i, (byte)imm8);
-
-		/// <summary>
-		/// Copy "a" to "tmp", then insert a single-precision (32-bit) floating-point element from "b" into "tmp" using the control in "imm8". Store "tmp" to "dst" using the mask in "imm8" (elements are zeroed out when the corresponding bit is set).
-		/// </summary>
-		/// <remarks><c>INSERTPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_insert_ps(__m128 a, __m128 b, int imm8) => System.Runtime.Intrinsics.X86.Sse41.Insert(a.FP32, b.FP32, (byte)imm8);
-
-		/// <summary>
-		/// Compare packed signed 32-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMAXSD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="b"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_max_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.Max(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Compare packed signed 8-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMAXSB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <param name="b"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_max_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.Max(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Compare packed unsigned 16-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMAXUW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_max_epu16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.Max(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Compare packed unsigned 32-bit integers in "a" and "b", and store packed maximum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMAXUD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="b"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_max_epu32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.Max(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Compare packed signed 32-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMINSD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="b"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_min_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.Min(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Compare packed signed 8-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMINSB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <param name="b"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_min_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.Min(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Compare packed unsigned 16-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMINUW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <param name="b"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_min_epu16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.Min(a.UI16, b.UI16);
-
-		/// <summary>
-		/// Compare packed unsigned 32-bit integers in "a" and "b", and store packed minimum values in "dst".
-		/// </summary>
-		/// <remarks><c>PMINUD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="b"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_min_epu32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.Min(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Horizontally compute the minimum amongst the packed unsigned 16-bit integers in "a", store the minimum and index in "dst", and zero the remaining bits in "dst".
-		/// </summary>
-		/// <remarks><c>PHMINPOSUW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_minpos_epu16(__m128i a) => System.Runtime.Intrinsics.X86.Sse41.MinHorizontal(a.UI16);
-
-		/// <summary>
-		/// Compute the sum of absolute differences (SADs) of quadruplets of unsigned 8-bit integers in "a" compared to those in "b", and store the 16-bit results in "dst".	Eight SADs are performed using one quadruplet from "b" and eight quadruplets from "a". One quadruplet is selected from "b" starting at on the offset specified in "imm8". Eight quadruplets are formed from sequential 8-bit integers selected from "a" starting at the offset specified in "imm8".
-		/// </summary>
-		/// <remarks><c>MPSADBW xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_mpsadbw_epu8(__m128i a, __m128i b, int imm8) => System.Runtime.Intrinsics.X86.Sse41.MultipleSumAbsoluteDifferences(a.UI8, b.UI8, (byte)imm8);
-
-		/// <summary>
-		/// Multiply the low signed 32-bit integers from each packed 64-bit element in "a" and "b", and store the signed 64-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>PMULDQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="b"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {SI64}</c></returns>
-		public static __m128i _mm_mul_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.Multiply(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Multiply the packed 32-bit integers in "a" and "b", producing intermediate 64-bit integers, and store the low 32 bits of the intermediate integers in "dst".
-		/// </summary>
-		/// <remarks><c>PMULLD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI32}</c></param>
-		/// <param name="b"><c>__m128i {UI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_mullo_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.MultiplyLow(a.UI32, b.UI32);
-
-		/// <summary>
-		/// Convert packed signed 32-bit integers from "a" and "b" to packed 16-bit integers using unsigned saturation, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PACKUSDW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="b"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_packus_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.PackUnsignedSaturate(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Round the packed double-precision (64-bit) floating-point elements in "a" using the "rounding" parameter, and store the results as packed double-precision floating-point elements in "dst".	[round_note]
-		/// </summary>
-		/// <remarks><c>ROUNDPD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="rounding"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_round_pd(__m128d a, int rounding) => System.Runtime.Intrinsics.X86.Sse41.RoundToNearestInteger(a.FP64);
-
-		/// <summary>
-		/// Round the packed single-precision (32-bit) floating-point elements in "a" using the "rounding" parameter, and store the results as packed single-precision floating-point elements in "dst".	[round_note]
-		/// </summary>
-		/// <remarks><c>ROUNDPS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="rounding"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_round_ps(__m128 a, int rounding) => System.Runtime.Intrinsics.X86.Sse41.RoundToNearestInteger(a.FP32);
-
-		/// <summary>
-		/// Round the lower double-precision (64-bit) floating-point element in "b" using the "rounding" parameter, store the result as a double-precision floating-point element in the lower element of "dst", and copy the upper element from "a" to the upper element of "dst".	[round_note]
-		/// </summary>
-		/// <remarks><c>ROUNDSD xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128d {FP64}</c></param>
-		/// <param name="b"><c>__m128d {FP64}</c></param>
-		/// <param name="rounding"><c>int {IMM}</c></param>
-		/// <returns><c>__m128d dst {FP64}</c></returns>
-		public static __m128d _mm_round_sd(__m128d a, __m128d b, int rounding) => System.Runtime.Intrinsics.X86.Sse41.RoundCurrentDirectionScalar(a.FP64);
-
-		/// <summary>
-		/// Round the lower single-precision (32-bit) floating-point element in "b" using the "rounding" parameter, store the result as a single-precision floating-point element in the lower element of "dst", and copy the upper 3 packed elements from "a" to the upper elements of "dst".	[round_note]
-		/// </summary>
-		/// <remarks><c>ROUNDSS xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128 {FP32}</c></param>
-		/// <param name="b"><c>__m128 {FP32}</c></param>
-		/// <param name="rounding"><c>int {IMM}</c></param>
-		/// <returns><c>__m128 dst {FP32}</c></returns>
-		public static __m128 _mm_round_ss(__m128 a, __m128 b, int rounding) => System.Runtime.Intrinsics.X86.Sse41.RoundCurrentDirectionScalar(a.FP32);
-
-		/// <summary>
-		/// Load 128-bits of integer data from memory into "dst" using a non-temporal memory hint.	"mem_addr" must be aligned on a 16-byte boundary or a general-protection exception may be generated.
-		/// </summary>
-		/// <remarks><c>MOVNTDQA xmm, m128</c></remarks>
-		/// <param name="mem_addr"><c>__m128i {M128}</c></param>
-		/// <returns><c>__m128i dst {M128}</c></returns>
-		public static __m128i _mm_stream_load_si128(__m128i* mem_addr) => System.Runtime.Intrinsics.X86.Sse41.LoadAlignedVector128NonTemporal((sbyte*)mem_addr);
-
-		/// <summary>
-		/// Compute the bitwise AND of 128 bits (representing integer data) in "a" and "b", and set "ZF" to 1 if the result is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", and set "CF" to 1 if the result is zero, otherwise set "CF" to 0. Return the "CF" value.
-		/// </summary>
-		/// <remarks><c>PTEST xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="b"><c>__m128i {M128}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_testc_si128(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.TestC(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Compute the bitwise AND of 128 bits (representing integer data) in "a" and "b", and set "ZF" to 1 if the result is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", and set "CF" to 1 if the result is zero, otherwise set "CF" to 0. Return 1 if both the "ZF" and "CF" values are zero, otherwise return 0.
-		/// </summary>
-		/// <remarks><c>PTEST xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="b"><c>__m128i {M128}</c></param>
-		/// <returns><c>bool dst {UI8}</c></returns>
-		public static bool _mm_testnzc_si128(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.TestNotZAndNotC(a.SI8, b.SI8);
-
-		/// <summary>
-		/// Compute the bitwise AND of 128 bits (representing integer data) in "a" and "b", and set "ZF" to 1 if the result is zero, otherwise set "ZF" to 0. Compute the bitwise NOT of "a" and then AND with "b", and set "CF" to 1 if the result is zero, otherwise set "CF" to 0. Return the "ZF" value.
-		/// </summary>
-		/// <remarks><c>PTEST xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {M128}</c></param>
-		/// <param name="b"><c>__m128i {M128}</c></param>
-		/// <returns><c>bool k {UI8}</c></returns>
-		public static bool _mm_testz_si128(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse41.TestZ(a.SI8, b.SI8);
-
-	}
-}
diff --git a/src/External/RawIntrinsics/SSE42.cs b/src/External/RawIntrinsics/SSE42.cs
deleted file mode 100644
index e0b939b..0000000
--- a/src/External/RawIntrinsics/SSE42.cs
+++ /dev/null
@@ -1,15 +0,0 @@
-namespace RawIntrinsics
-{
-	public static unsafe partial class SSE42
-	{
-		/// <summary>
-		/// Compare packed signed 64-bit integers in "a" and "b" for greater-than, and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PCMPGTQ xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI64}</c></param>
-		/// <param name="b"><c>__m128i {SI64}</c></param>
-		/// <returns><c>__m128i dst {UI64}</c></returns>
-		public static __m128i _mm_cmpgt_epi64(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Sse42.CompareGreaterThan(a.SI64, b.SI64);
-
-	}
-}
diff --git a/src/External/RawIntrinsics/SSSE3.cs b/src/External/RawIntrinsics/SSSE3.cs
deleted file mode 100644
index 66c40b0..0000000
--- a/src/External/RawIntrinsics/SSSE3.cs
+++ /dev/null
@@ -1,148 +0,0 @@
-namespace RawIntrinsics
-{
-	public static unsafe partial class SSSE3
-	{
-		/// <summary>
-		/// Compute the absolute value of packed signed 16-bit integers in "a", and store the unsigned results in "dst".
-		/// </summary>
-		/// <remarks><c>PABSW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_abs_epi16(__m128i a) => System.Runtime.Intrinsics.X86.Ssse3.Abs(a.SI16);
-
-		/// <summary>
-		/// Compute the absolute value of packed signed 32-bit integers in "a", and store the unsigned results in "dst".
-		/// </summary>
-		/// <remarks><c>PABSD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_abs_epi32(__m128i a) => System.Runtime.Intrinsics.X86.Ssse3.Abs(a.SI32);
-
-		/// <summary>
-		/// Compute the absolute value of packed signed 8-bit integers in "a", and store the unsigned results in "dst".
-		/// </summary>
-		/// <remarks><c>PABSB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_abs_epi8(__m128i a) => System.Runtime.Intrinsics.X86.Ssse3.Abs(a.SI8);
-
-		/// <summary>
-		/// Concatenate 16-byte blocks in "a" and "b" into a 32-byte temporary result, shift the result right by "imm8" bytes, and store the low 16 bytes in "dst".
-		/// </summary>
-		/// <remarks><c>PALIGNR xmm, xmm, imm8</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <param name="imm8"><c>int {IMM}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_alignr_epi8(__m128i a, __m128i b, int imm8) => System.Runtime.Intrinsics.X86.Ssse3.AlignRight(a.UI8, b.UI8, (byte)imm8);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of 16-bit integers in "a" and "b", and pack the signed 16-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>PHADDW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {SI16}</c></returns>
-		public static __m128i _mm_hadd_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.HorizontalAdd(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of 32-bit integers in "a" and "b", and pack the signed 32-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>PHADDD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="b"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {SI32}</c></returns>
-		public static __m128i _mm_hadd_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.HorizontalAdd(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Horizontally add adjacent pairs of signed 16-bit integers in "a" and "b" using saturation, and pack the signed 16-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>PHADDSW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {SI16}</c></returns>
-		public static __m128i _mm_hadds_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.HorizontalAddSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Horizontally subtract adjacent pairs of 16-bit integers in "a" and "b", and pack the signed 16-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>PHSUBW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {SI16}</c></returns>
-		public static __m128i _mm_hsub_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.HorizontalSubtract(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Horizontally subtract adjacent pairs of 32-bit integers in "a" and "b", and pack the signed 32-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>PHSUBD xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="b"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {SI32}</c></returns>
-		public static __m128i _mm_hsub_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.HorizontalSubtract(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Horizontally subtract adjacent pairs of signed 16-bit integers in "a" and "b" using saturation, and pack the signed 16-bit results in "dst".
-		/// </summary>
-		/// <remarks><c>PHSUBSW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {SI16}</c></returns>
-		public static __m128i _mm_hsubs_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.HorizontalSubtractSaturate(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Vertically multiply each unsigned 8-bit integer from "a" with the corresponding signed 8-bit integer from "b", producing intermediate signed 16-bit integers. Horizontally add adjacent pairs of intermediate signed 16-bit integers, and pack the saturated results in "dst".
-		/// </summary>
-		/// <remarks><c>PMADDUBSW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {SI16}</c></returns>
-		public static __m128i _mm_maddubs_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.MultiplyAddAdjacent(a.UI8, b.SI8);
-
-		/// <summary>
-		/// Multiply packed signed 16-bit integers in "a" and "b", producing intermediate signed 32-bit integers. Truncate each intermediate integer to the 18 most significant bits, round by adding 1, and store bits [16:1] to "dst".
-		/// </summary>
-		/// <remarks><c>PMULHRSW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_mulhrs_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.MultiplyHighRoundScale(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Shuffle packed 8-bit integers in "a" according to shuffle control mask in the corresponding 8-bit element of "b", and store the results in "dst".
-		/// </summary>
-		/// <remarks><c>PSHUFB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {UI8}</c></param>
-		/// <param name="b"><c>__m128i {UI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_shuffle_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.Shuffle(a.UI8, b.UI8);
-
-		/// <summary>
-		/// Negate packed 16-bit integers in "a" when the corresponding signed 16-bit integer in "b" is negative, and store the results in "dst". Element in "dst" are zeroed out when the corresponding element in "b" is zero.
-		/// </summary>
-		/// <remarks><c>PSIGNW xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI16}</c></param>
-		/// <param name="b"><c>__m128i {SI16}</c></param>
-		/// <returns><c>__m128i dst {UI16}</c></returns>
-		public static __m128i _mm_sign_epi16(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.Sign(a.SI16, b.SI16);
-
-		/// <summary>
-		/// Negate packed 32-bit integers in "a" when the corresponding signed 32-bit integer in "b" is negative, and store the results in "dst". Element in "dst" are zeroed out when the corresponding element in "b" is zero.
-		/// </summary>
-		/// <remarks><c>PSIGND xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI32}</c></param>
-		/// <param name="b"><c>__m128i {SI32}</c></param>
-		/// <returns><c>__m128i dst {UI32}</c></returns>
-		public static __m128i _mm_sign_epi32(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.Sign(a.SI32, b.SI32);
-
-		/// <summary>
-		/// Negate packed 8-bit integers in "a" when the corresponding signed 8-bit integer in "b" is negative, and store the results in "dst". Element in "dst" are zeroed out when the corresponding element in "b" is zero.
-		/// </summary>
-		/// <remarks><c>PSIGNB xmm, xmm</c></remarks>
-		/// <param name="a"><c>__m128i {SI8}</c></param>
-		/// <param name="b"><c>__m128i {SI8}</c></param>
-		/// <returns><c>__m128i dst {UI8}</c></returns>
-		public static __m128i _mm_sign_epi8(__m128i a, __m128i b) => System.Runtime.Intrinsics.X86.Ssse3.Sign(a.SI8, b.SI8);
-
-	}
-}
diff --git a/src/External/RawIntrinsics/Types.cs b/src/External/RawIntrinsics/Types.cs
deleted file mode 100644
index c08378b..0000000
--- a/src/External/RawIntrinsics/Types.cs
+++ /dev/null
@@ -1,178 +0,0 @@
-namespace RawIntrinsics
-{
-	public struct __m64
-	{
-		private System.Runtime.Intrinsics.Vector64<byte> _;
-		public System.Runtime.Intrinsics.Vector64<byte> UI8 => System.Runtime.Intrinsics.Vector64.AsByte(_);
-		public System.Runtime.Intrinsics.Vector64<sbyte> SI8 => System.Runtime.Intrinsics.Vector64.AsSByte(_);
-		public System.Runtime.Intrinsics.Vector64<ushort> UI16 => System.Runtime.Intrinsics.Vector64.AsUInt16(_);
-		public System.Runtime.Intrinsics.Vector64<short> SI16 => System.Runtime.Intrinsics.Vector64.AsInt16(_);
-		public System.Runtime.Intrinsics.Vector64<uint> UI32 => System.Runtime.Intrinsics.Vector64.AsUInt32(_);
-		public System.Runtime.Intrinsics.Vector64<int> SI32 => System.Runtime.Intrinsics.Vector64.AsInt32(_);
-		public System.Runtime.Intrinsics.Vector64<ulong> UI64 => System.Runtime.Intrinsics.Vector64.AsUInt64(_);
-		public System.Runtime.Intrinsics.Vector64<long> SI64 => System.Runtime.Intrinsics.Vector64.AsInt64(_);
-		public System.Runtime.Intrinsics.Vector64<float> FP32 => System.Runtime.Intrinsics.Vector64.AsSingle(_);
-		public System.Runtime.Intrinsics.Vector64<double> FP64 => System.Runtime.Intrinsics.Vector64.AsDouble(_);
-		public static implicit operator __m64(System.Runtime.Intrinsics.Vector64<byte> v) => new __m64 { _ = System.Runtime.Intrinsics.Vector64.AsByte(v) };
-		public static implicit operator __m64(System.Runtime.Intrinsics.Vector64<sbyte> v) => new __m64 { _ = System.Runtime.Intrinsics.Vector64.AsByte(v) };
-		public static implicit operator __m64(System.Runtime.Intrinsics.Vector64<ushort> v) => new __m64 { _ = System.Runtime.Intrinsics.Vector64.AsByte(v) };
-		public static implicit operator __m64(System.Runtime.Intrinsics.Vector64<short> v) => new __m64 { _ = System.Runtime.Intrinsics.Vector64.AsByte(v) };
-		public static implicit operator __m64(System.Runtime.Intrinsics.Vector64<uint> v) => new __m64 { _ = System.Runtime.Intrinsics.Vector64.AsByte(v) };
-		public static implicit operator __m64(System.Runtime.Intrinsics.Vector64<int> v) => new __m64 { _ = System.Runtime.Intrinsics.Vector64.AsByte(v) };
-		public static implicit operator __m64(System.Runtime.Intrinsics.Vector64<ulong> v) => new __m64 { _ = System.Runtime.Intrinsics.Vector64.AsByte(v) };
-		public static implicit operator __m64(System.Runtime.Intrinsics.Vector64<long> v) => new __m64 { _ = System.Runtime.Intrinsics.Vector64.AsByte(v) };
-		public static implicit operator __m64(System.Runtime.Intrinsics.Vector64<float> v) => new __m64 { _ = System.Runtime.Intrinsics.Vector64.AsByte(v) };
-		public static implicit operator __m64(System.Runtime.Intrinsics.Vector64<double> v) => new __m64 { _ = System.Runtime.Intrinsics.Vector64.AsByte(v) };
-	}
-
-	public struct __m128
-	{
-		private System.Runtime.Intrinsics.Vector128<byte> _;
-		public System.Runtime.Intrinsics.Vector128<byte> UI8 => System.Runtime.Intrinsics.Vector128.AsByte(_);
-		public System.Runtime.Intrinsics.Vector128<sbyte> SI8 => System.Runtime.Intrinsics.Vector128.AsSByte(_);
-		public System.Runtime.Intrinsics.Vector128<ushort> UI16 => System.Runtime.Intrinsics.Vector128.AsUInt16(_);
-		public System.Runtime.Intrinsics.Vector128<short> SI16 => System.Runtime.Intrinsics.Vector128.AsInt16(_);
-		public System.Runtime.Intrinsics.Vector128<uint> UI32 => System.Runtime.Intrinsics.Vector128.AsUInt32(_);
-		public System.Runtime.Intrinsics.Vector128<int> SI32 => System.Runtime.Intrinsics.Vector128.AsInt32(_);
-		public System.Runtime.Intrinsics.Vector128<ulong> UI64 => System.Runtime.Intrinsics.Vector128.AsUInt64(_);
-		public System.Runtime.Intrinsics.Vector128<long> SI64 => System.Runtime.Intrinsics.Vector128.AsInt64(_);
-		public System.Runtime.Intrinsics.Vector128<float> FP32 => System.Runtime.Intrinsics.Vector128.AsSingle(_);
-		public System.Runtime.Intrinsics.Vector128<double> FP64 => System.Runtime.Intrinsics.Vector128.AsDouble(_);
-		public static implicit operator __m128(System.Runtime.Intrinsics.Vector128<byte> v) => new __m128 { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128(System.Runtime.Intrinsics.Vector128<sbyte> v) => new __m128 { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128(System.Runtime.Intrinsics.Vector128<ushort> v) => new __m128 { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128(System.Runtime.Intrinsics.Vector128<short> v) => new __m128 { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128(System.Runtime.Intrinsics.Vector128<uint> v) => new __m128 { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128(System.Runtime.Intrinsics.Vector128<int> v) => new __m128 { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128(System.Runtime.Intrinsics.Vector128<ulong> v) => new __m128 { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128(System.Runtime.Intrinsics.Vector128<long> v) => new __m128 { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128(System.Runtime.Intrinsics.Vector128<float> v) => new __m128 { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128(System.Runtime.Intrinsics.Vector128<double> v) => new __m128 { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-	}
-
-	public struct __m128i
-	{
-		private System.Runtime.Intrinsics.Vector128<byte> _;
-		public System.Runtime.Intrinsics.Vector128<byte> UI8 => System.Runtime.Intrinsics.Vector128.AsByte(_);
-		public System.Runtime.Intrinsics.Vector128<sbyte> SI8 => System.Runtime.Intrinsics.Vector128.AsSByte(_);
-		public System.Runtime.Intrinsics.Vector128<ushort> UI16 => System.Runtime.Intrinsics.Vector128.AsUInt16(_);
-		public System.Runtime.Intrinsics.Vector128<short> SI16 => System.Runtime.Intrinsics.Vector128.AsInt16(_);
-		public System.Runtime.Intrinsics.Vector128<uint> UI32 => System.Runtime.Intrinsics.Vector128.AsUInt32(_);
-		public System.Runtime.Intrinsics.Vector128<int> SI32 => System.Runtime.Intrinsics.Vector128.AsInt32(_);
-		public System.Runtime.Intrinsics.Vector128<ulong> UI64 => System.Runtime.Intrinsics.Vector128.AsUInt64(_);
-		public System.Runtime.Intrinsics.Vector128<long> SI64 => System.Runtime.Intrinsics.Vector128.AsInt64(_);
-		public System.Runtime.Intrinsics.Vector128<float> FP32 => System.Runtime.Intrinsics.Vector128.AsSingle(_);
-		public System.Runtime.Intrinsics.Vector128<double> FP64 => System.Runtime.Intrinsics.Vector128.AsDouble(_);
-		public static implicit operator __m128i(System.Runtime.Intrinsics.Vector128<byte> v) => new __m128i { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128i(System.Runtime.Intrinsics.Vector128<sbyte> v) => new __m128i { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128i(System.Runtime.Intrinsics.Vector128<ushort> v) => new __m128i { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128i(System.Runtime.Intrinsics.Vector128<short> v) => new __m128i { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128i(System.Runtime.Intrinsics.Vector128<uint> v) => new __m128i { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128i(System.Runtime.Intrinsics.Vector128<int> v) => new __m128i { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128i(System.Runtime.Intrinsics.Vector128<ulong> v) => new __m128i { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128i(System.Runtime.Intrinsics.Vector128<long> v) => new __m128i { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128i(System.Runtime.Intrinsics.Vector128<float> v) => new __m128i { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128i(System.Runtime.Intrinsics.Vector128<double> v) => new __m128i { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-	}
-
-	public struct __m128d
-	{
-		private System.Runtime.Intrinsics.Vector128<byte> _;
-		public System.Runtime.Intrinsics.Vector128<byte> UI8 => System.Runtime.Intrinsics.Vector128.AsByte(_);
-		public System.Runtime.Intrinsics.Vector128<sbyte> SI8 => System.Runtime.Intrinsics.Vector128.AsSByte(_);
-		public System.Runtime.Intrinsics.Vector128<ushort> UI16 => System.Runtime.Intrinsics.Vector128.AsUInt16(_);
-		public System.Runtime.Intrinsics.Vector128<short> SI16 => System.Runtime.Intrinsics.Vector128.AsInt16(_);
-		public System.Runtime.Intrinsics.Vector128<uint> UI32 => System.Runtime.Intrinsics.Vector128.AsUInt32(_);
-		public System.Runtime.Intrinsics.Vector128<int> SI32 => System.Runtime.Intrinsics.Vector128.AsInt32(_);
-		public System.Runtime.Intrinsics.Vector128<ulong> UI64 => System.Runtime.Intrinsics.Vector128.AsUInt64(_);
-		public System.Runtime.Intrinsics.Vector128<long> SI64 => System.Runtime.Intrinsics.Vector128.AsInt64(_);
-		public System.Runtime.Intrinsics.Vector128<float> FP32 => System.Runtime.Intrinsics.Vector128.AsSingle(_);
-		public System.Runtime.Intrinsics.Vector128<double> FP64 => System.Runtime.Intrinsics.Vector128.AsDouble(_);
-		public static implicit operator __m128d(System.Runtime.Intrinsics.Vector128<byte> v) => new __m128d { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128d(System.Runtime.Intrinsics.Vector128<sbyte> v) => new __m128d { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128d(System.Runtime.Intrinsics.Vector128<ushort> v) => new __m128d { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128d(System.Runtime.Intrinsics.Vector128<short> v) => new __m128d { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128d(System.Runtime.Intrinsics.Vector128<uint> v) => new __m128d { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128d(System.Runtime.Intrinsics.Vector128<int> v) => new __m128d { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128d(System.Runtime.Intrinsics.Vector128<ulong> v) => new __m128d { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128d(System.Runtime.Intrinsics.Vector128<long> v) => new __m128d { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128d(System.Runtime.Intrinsics.Vector128<float> v) => new __m128d { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-		public static implicit operator __m128d(System.Runtime.Intrinsics.Vector128<double> v) => new __m128d { _ = System.Runtime.Intrinsics.Vector128.AsByte(v) };
-	}
-
-	public struct __m256
-	{
-		private System.Runtime.Intrinsics.Vector256<byte> _;
-		public System.Runtime.Intrinsics.Vector256<byte> UI8 => System.Runtime.Intrinsics.Vector256.AsByte(_);
-		public System.Runtime.Intrinsics.Vector256<sbyte> SI8 => System.Runtime.Intrinsics.Vector256.AsSByte(_);
-		public System.Runtime.Intrinsics.Vector256<ushort> UI16 => System.Runtime.Intrinsics.Vector256.AsUInt16(_);
-		public System.Runtime.Intrinsics.Vector256<short> SI16 => System.Runtime.Intrinsics.Vector256.AsInt16(_);
-		public System.Runtime.Intrinsics.Vector256<uint> UI32 => System.Runtime.Intrinsics.Vector256.AsUInt32(_);
-		public System.Runtime.Intrinsics.Vector256<int> SI32 => System.Runtime.Intrinsics.Vector256.AsInt32(_);
-		public System.Runtime.Intrinsics.Vector256<ulong> UI64 => System.Runtime.Intrinsics.Vector256.AsUInt64(_);
-		public System.Runtime.Intrinsics.Vector256<long> SI64 => System.Runtime.Intrinsics.Vector256.AsInt64(_);
-		public System.Runtime.Intrinsics.Vector256<float> FP32 => System.Runtime.Intrinsics.Vector256.AsSingle(_);
-		public System.Runtime.Intrinsics.Vector256<double> FP64 => System.Runtime.Intrinsics.Vector256.AsDouble(_);
-		public static implicit operator __m256(System.Runtime.Intrinsics.Vector256<byte> v) => new __m256 { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256(System.Runtime.Intrinsics.Vector256<sbyte> v) => new __m256 { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256(System.Runtime.Intrinsics.Vector256<ushort> v) => new __m256 { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256(System.Runtime.Intrinsics.Vector256<short> v) => new __m256 { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256(System.Runtime.Intrinsics.Vector256<uint> v) => new __m256 { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256(System.Runtime.Intrinsics.Vector256<int> v) => new __m256 { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256(System.Runtime.Intrinsics.Vector256<ulong> v) => new __m256 { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256(System.Runtime.Intrinsics.Vector256<long> v) => new __m256 { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256(System.Runtime.Intrinsics.Vector256<float> v) => new __m256 { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256(System.Runtime.Intrinsics.Vector256<double> v) => new __m256 { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-	}
-
-	public struct __m256i
-	{
-		private System.Runtime.Intrinsics.Vector256<byte> _;
-		public System.Runtime.Intrinsics.Vector256<byte> UI8 => System.Runtime.Intrinsics.Vector256.AsByte(_);
-		public System.Runtime.Intrinsics.Vector256<sbyte> SI8 => System.Runtime.Intrinsics.Vector256.AsSByte(_);
-		public System.Runtime.Intrinsics.Vector256<ushort> UI16 => System.Runtime.Intrinsics.Vector256.AsUInt16(_);
-		public System.Runtime.Intrinsics.Vector256<short> SI16 => System.Runtime.Intrinsics.Vector256.AsInt16(_);
-		public System.Runtime.Intrinsics.Vector256<uint> UI32 => System.Runtime.Intrinsics.Vector256.AsUInt32(_);
-		public System.Runtime.Intrinsics.Vector256<int> SI32 => System.Runtime.Intrinsics.Vector256.AsInt32(_);
-		public System.Runtime.Intrinsics.Vector256<ulong> UI64 => System.Runtime.Intrinsics.Vector256.AsUInt64(_);
-		public System.Runtime.Intrinsics.Vector256<long> SI64 => System.Runtime.Intrinsics.Vector256.AsInt64(_);
-		public System.Runtime.Intrinsics.Vector256<float> FP32 => System.Runtime.Intrinsics.Vector256.AsSingle(_);
-		public System.Runtime.Intrinsics.Vector256<double> FP64 => System.Runtime.Intrinsics.Vector256.AsDouble(_);
-		public static implicit operator __m256i(System.Runtime.Intrinsics.Vector256<byte> v) => new __m256i { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256i(System.Runtime.Intrinsics.Vector256<sbyte> v) => new __m256i { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256i(System.Runtime.Intrinsics.Vector256<ushort> v) => new __m256i { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256i(System.Runtime.Intrinsics.Vector256<short> v) => new __m256i { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256i(System.Runtime.Intrinsics.Vector256<uint> v) => new __m256i { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256i(System.Runtime.Intrinsics.Vector256<int> v) => new __m256i { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256i(System.Runtime.Intrinsics.Vector256<ulong> v) => new __m256i { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256i(System.Runtime.Intrinsics.Vector256<long> v) => new __m256i { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256i(System.Runtime.Intrinsics.Vector256<float> v) => new __m256i { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256i(System.Runtime.Intrinsics.Vector256<double> v) => new __m256i { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-	}
-
-	public struct __m256d
-	{
-		private System.Runtime.Intrinsics.Vector256<byte> _;
-		public System.Runtime.Intrinsics.Vector256<byte> UI8 => System.Runtime.Intrinsics.Vector256.AsByte(_);
-		public System.Runtime.Intrinsics.Vector256<sbyte> SI8 => System.Runtime.Intrinsics.Vector256.AsSByte(_);
-		public System.Runtime.Intrinsics.Vector256<ushort> UI16 => System.Runtime.Intrinsics.Vector256.AsUInt16(_);
-		public System.Runtime.Intrinsics.Vector256<short> SI16 => System.Runtime.Intrinsics.Vector256.AsInt16(_);
-		public System.Runtime.Intrinsics.Vector256<uint> UI32 => System.Runtime.Intrinsics.Vector256.AsUInt32(_);
-		public System.Runtime.Intrinsics.Vector256<int> SI32 => System.Runtime.Intrinsics.Vector256.AsInt32(_);
-		public System.Runtime.Intrinsics.Vector256<ulong> UI64 => System.Runtime.Intrinsics.Vector256.AsUInt64(_);
-		public System.Runtime.Intrinsics.Vector256<long> SI64 => System.Runtime.Intrinsics.Vector256.AsInt64(_);
-		public System.Runtime.Intrinsics.Vector256<float> FP32 => System.Runtime.Intrinsics.Vector256.AsSingle(_);
-		public System.Runtime.Intrinsics.Vector256<double> FP64 => System.Runtime.Intrinsics.Vector256.AsDouble(_);
-		public static implicit operator __m256d(System.Runtime.Intrinsics.Vector256<byte> v) => new __m256d { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256d(System.Runtime.Intrinsics.Vector256<sbyte> v) => new __m256d { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256d(System.Runtime.Intrinsics.Vector256<ushort> v) => new __m256d { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256d(System.Runtime.Intrinsics.Vector256<short> v) => new __m256d { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256d(System.Runtime.Intrinsics.Vector256<uint> v) => new __m256d { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256d(System.Runtime.Intrinsics.Vector256<int> v) => new __m256d { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256d(System.Runtime.Intrinsics.Vector256<ulong> v) => new __m256d { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256d(System.Runtime.Intrinsics.Vector256<long> v) => new __m256d { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256d(System.Runtime.Intrinsics.Vector256<float> v) => new __m256d { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-		public static implicit operator __m256d(System.Runtime.Intrinsics.Vector256<double> v) => new __m256d { _ = System.Runtime.Intrinsics.Vector256.AsByte(v) };
-	}
-
-}
diff --git a/src/External/RawIntrinsics/Utils.ManuallyAdded.cs b/src/External/RawIntrinsics/Utils.ManuallyAdded.cs
deleted file mode 100644
index 314cb9d..0000000
--- a/src/External/RawIntrinsics/Utils.ManuallyAdded.cs
+++ /dev/null
@@ -1,7 +0,0 @@
-﻿namespace RawIntrinsics
-{
-	public static class Utils
-	{
-		public static int _MM_SHUFFLE(int z, int y, int x, int w) => (z << 6) | (y << 4) | (x << 2) | w;
-	}
-}
diff --git a/src/External/RawIntrinsicsGenerator/Generator.cs b/src/External/RawIntrinsicsGenerator/Generator.cs
deleted file mode 100644
index 7eeb8b8..0000000
--- a/src/External/RawIntrinsicsGenerator/Generator.cs
+++ /dev/null
@@ -1,556 +0,0 @@
-using System.Collections.Concurrent;
-using System.Diagnostics;
-using System.Runtime.Intrinsics;
-using System.Text;
-using System.Text.RegularExpressions;
-using System.Xml;
-
-using Microsoft.CodeAnalysis;
-using Microsoft.CodeAnalysis.CSharp;
-using Microsoft.CodeAnalysis.CSharp.Syntax;
-
-namespace RawIntrinsicsGenerator
-{
-    public static class Generator
-	{
-		private const string SriDataUrl1 = @"https://raw.githubusercontent.com/dotnet/runtime/release/7.0/src/libraries/System.Private.CoreLib/src/System/Runtime/Intrinsics/X86/";
-		private const string SriDataUrl2 = @"https://raw.githubusercontent.com/dotnet/runtime/release/7.0/src/libraries/System.Private.CoreLib/src/System/Runtime/Intrinsics/";
-		private const string IntelDataUrl = @"https://www.intel.com/content/dam/develop/public/us/en/include/intrinsics-guide/data-3-6-5.xml";
-		
-		private static readonly Regex IntelMethodSignature = new(@"///\s+?(?<rt>[\w_]+)\s+?(?<fn>_mm[\w_]+)\s*?\((?<a>[\w\s,*]+)\)", RegexOptions.Compiled);
-		private static readonly Regex IntelMethodSignatureSimpilfied = new(@"\s+?(?<rt>[\w_]+)\s+?(?<fn>_mm[\w_]+)\s*?", RegexOptions.Compiled);
-		private static readonly Regex IntelTypeDef = new(@"(?:(?<is_unsigned>unsigned)\s+?)?(?:const\s+)?(?<type_name>void|char|short|int|long|long\s+?long|float|double|__int32|__int64|(?:(?:__m64|__m128|__m256)(?:i|d)?)|__mmask8|__mmask16|__mmask32|__mmask64)[^*""]*(?<is_ptr>\*)?", RegexOptions.Compiled);
-
-		private static readonly Dictionary<string, (string srcUrl, Regex matcher)> TechnologyMap = new()
-		{
-			{"Sse", (SriDataUrl1, IntelMethodSignature)},
-			{"Sse2", (SriDataUrl1, IntelMethodSignature)},
-			{"Sse3", (SriDataUrl1, IntelMethodSignature)},
-			{"Sse41", (SriDataUrl1, IntelMethodSignature)},
-			{"Sse42", (SriDataUrl1, IntelMethodSignature)},
-			{"Ssse3", (SriDataUrl1, IntelMethodSignature)},
-			{"Avx", (SriDataUrl1, IntelMethodSignature)},
-			{"Avx2", (SriDataUrl1, IntelMethodSignature)},
-			{"Fma", (SriDataUrl1, IntelMethodSignature)},
-			{"Aes", (SriDataUrl1, IntelMethodSignature)},
-			{"Bmi1", (SriDataUrl1, IntelMethodSignature)},
-			{"Bmi2", (SriDataUrl1, IntelMethodSignature)},
-			{"Lzcnt", (SriDataUrl1, IntelMethodSignature)},
-			{"Popcnt", (SriDataUrl1, IntelMethodSignature)},
-			{"Pclmulqdq", (SriDataUrl1, IntelMethodSignature)},
-			{"Vector64", (SriDataUrl2, IntelMethodSignatureSimpilfied)},
-			{"Vector128", (SriDataUrl2, IntelMethodSignatureSimpilfied)},
-			{"Vector256", (SriDataUrl2, IntelMethodSignatureSimpilfied)},
-		};
-
-		public static async Task Generate(string ns, string saveToPath)
-		{
-			var intelDataFile = await FetchFileContent(IntelDataUrl);
-            intelDataFile = intelDataFile.Trim();
-
-            var xml = new XmlDocument(); 
-			xml.LoadXml(intelDataFile);
-			var intelData = new ConcurrentBag<XmlNode>(xml.SelectNodes(@"//intrinsic")?.Cast<XmlNode>().ToList() ?? new List<XmlNode>());
-
-			var outputData = new ConcurrentDictionary<string, ConcurrentDictionary<string, string>>();
-
-			foreach (var kv in TechnologyMap)
-			{
-				await Generate($"{kv.Value.srcUrl}{kv.Key}.cs", kv.Value.matcher, intelData, outputData);
-			}
-
-			if (Directory.Exists(saveToPath))
-			{
-				foreach(var fi in new DirectoryInfo(saveToPath).GetFiles())
-				{
-					fi.Delete();
-				}
-				Directory.Delete(saveToPath);
-			}
-			Directory.CreateDirectory(saveToPath);
-			
-			var codeGenSb = new StringBuilder();
-			string tabOffset;
-			foreach (var (tech, generatedSrc) in outputData)
-			{
-				codeGenSb.Clear();
-				tabOffset = "";
-				codeGenSb.AppendLine($"{tabOffset}namespace {ns}");
-				codeGenSb.AppendLine($"{tabOffset}{{");
-
-				tabOffset = "\t";
-				codeGenSb.AppendLine($"{tabOffset}public static unsafe partial class {tech}");
-				codeGenSb.AppendLine($"{tabOffset}{{");
-				
-				foreach (var intelMethodName in generatedSrc.Keys.OrderBy(_ => _))
-				{
-					codeGenSb.AppendLine(generatedSrc[intelMethodName]);
-				}
-				
-				tabOffset = "\t";
-				codeGenSb.AppendLine($"{tabOffset}}}");
-				
-				tabOffset = "";
-				codeGenSb.AppendLine($"{tabOffset}}}");
-				
-				await File.WriteAllTextAsync(Path.Combine(saveToPath, $"{tech}.cs"), codeGenSb.ToString());
-			}
-
-			codeGenSb.Clear();
-			tabOffset = "";
-			codeGenSb.AppendLine($"{tabOffset}namespace {ns}");
-			codeGenSb.AppendLine($"{tabOffset}{{");
-
-			foreach (var t in new[] {(64, null), (128, null), (128, "i"), (128, "d"), (256, null), (256, "i"), (256, "d")})
-			{
-				var (size, pf) = t;
-				codeGenSb.AppendLine(GenerateMType(size, pf));
-			}
-			tabOffset = "";
-			codeGenSb.AppendLine($"{tabOffset}}}");
-
-			await File.WriteAllTextAsync(Path.Combine(saveToPath, $"Types.cs"), codeGenSb.ToString());
-		}
-
-		private static readonly (string etype, string convFn)[] EtypeToReninterpretMethodMap = {("UI8", "AsByte"), ("SI8", "AsSByte"), ("UI16", "AsUInt16"), ("SI16", "AsInt16"), ("UI32", "AsUInt32"), ("SI32", "AsInt32"), ("UI64", "AsUInt64"), ("SI64", "AsInt64"), ("FP32", "AsSingle"), ("FP64", "AsDouble")};
-		
-		private static string GenerateMType(int size, string pf = null)
-		{
-			var mTypeName = pf == null ? $"__m{size}" : $"__m{size}{pf}" ;
-			var codeGenSb = new StringBuilder();
-
-			var csVectorTypeName = $"System.Runtime.Intrinsics.Vector{size}";
-			
-			var tabOffset = "\t";
-			codeGenSb.AppendLine($"{tabOffset}public struct {mTypeName}");
-			codeGenSb.AppendLine($"{tabOffset}{{");
-
-			tabOffset = "\t\t";
-			codeGenSb.AppendLine($"{tabOffset}private {csVectorTypeName}<byte> _;");
-
-			foreach (var (etype, convFn) in EtypeToReninterpretMethodMap)
-			{
-				var csType = EtypeToCsTypeName(etype);
-				codeGenSb.AppendLine($"{tabOffset}public {csVectorTypeName}<{csType}> {etype} => {csVectorTypeName}.{convFn}(_);");
-			}
-
-			foreach (var (etype, _) in EtypeToReninterpretMethodMap)
-			{
-				var csType = EtypeToCsTypeName(etype);
-				codeGenSb.AppendLine($"{tabOffset}public static implicit operator {mTypeName}({csVectorTypeName}<{csType}> v) => new {mTypeName} {{ _ = {csVectorTypeName}.AsByte(v) }};");
-			}
-
-			tabOffset = "\t";
-			codeGenSb.AppendLine($"{tabOffset}}}");
-			return codeGenSb.ToString();
-		}
-
-		private static async Task Generate(string sriUrl, Regex cppIntrinsicNameMatcher, ConcurrentBag<XmlNode> intelData, ConcurrentDictionary<string, ConcurrentDictionary<string, string>> outputData)
-		{
-			var intelMethod2CsMethodMap = new Dictionary<string, List<CsMethod>>();
-
-			var sriData = await FetchFileContent(sriUrl);
-
-			var syntaxTree = CSharpSyntaxTree.ParseText(sriData);
-			var compilation = CSharpCompilation.Create("Test").AddReferences(MetadataReference.CreateFromFile(typeof(object).Assembly.Location)).AddReferences(MetadataReference.CreateFromFile(typeof(Vector128).Assembly.Location)).AddSyntaxTrees(syntaxTree);
-			var semanticModel = compilation.GetSemanticModel(syntaxTree);
-			var syntaxTreeRoot = (CompilationUnitSyntax) await syntaxTree.GetRootAsync();
-
-			var methodDeclarations = syntaxTreeRoot.DescendantNodes(_ => true, true).OfType<MethodDeclarationSyntax>();
-
-			foreach (var methodDeclaration in methodDeclarations)
-			{
-				SyntaxTrivia comments = default;
-				if (!methodDeclaration.HasLeadingTrivia || methodDeclaration.GetLeadingTrivia().All(t => (comments = t).Kind() != SyntaxKind.SingleLineDocumentationCommentTrivia || comments.GetStructure() is not DocumentationCommentTriviaSyntax)) continue;
-
-				Match match = default;
-				var _ = ((DocumentationCommentTriviaSyntax) comments.GetStructure()).Content.OfType<XmlElementSyntax>().FirstOrDefault(x => (match = cppIntrinsicNameMatcher.Match(x.Content.ToFullString())).Success);
-
-				if (!match.Success) continue;
-
-				var methodSymbol = semanticModel.GetDeclaredSymbol(methodDeclaration);
-				var csMethod = new CsMethod
-				{
-					Name = methodDeclaration.Identifier.ToString(),
-					ClassPath = methodSymbol.ReceiverType.ToDisplayString(),
-					Parameters = new CsMethodParam[methodSymbol.Parameters.Length]
-				};
-
-				if (IsCsIntrinsicType(methodSymbol.ReturnType.Name))
-				{
-					csMethod.ReturnType.Name = methodSymbol.ReturnType.Name;
-					csMethod.ReturnType.TypeParameter = methodDeclaration.ReturnType is GenericNameSyntax returnType ? returnType.TypeArgumentList.Arguments[0].ToString() : null;
-				}
-				else if (methodSymbol.ReturnType is not INamedTypeSymbol {IsGenericType: true})
-				{
-					if (methodDeclaration.ReturnType is PointerTypeSyntax)
-					{
-						csMethod.ReturnType.Name = ((IPointerTypeSymbol) methodSymbol.ReturnType).PointedAtType.ToDisplayString();
-						csMethod.ReturnType.IsPointer = true;
-					}
-					else
-					{
-						csMethod.ReturnType.Name = methodSymbol.ReturnType.ToDisplayString();
-					}
-				}
-				else
-				{
-					throw new InvalidOperationException($"Unknown return type {methodSymbol.ReturnType.Name}");
-				}
-
-				for (var j = 0; j < methodSymbol.Parameters.Length; j++)
-				{
-					var parameter = methodDeclaration.ParameterList.Parameters[j];
-
-					var parameterSymbol = methodSymbol.Parameters[j];
-					var csParameter = new CsMethodParam {Name = parameterSymbol.Name};
-					if (parameterSymbol.Type is not INamedTypeSymbol {IsGenericType: true} || !IsCsIntrinsicType(parameterSymbol.Type.Name))
-					{
-						if (parameter.Type is PointerTypeSyntax)
-						{
-							csParameter.Type = new CsType
-							{
-								Name = ((IPointerTypeSymbol) parameterSymbol.Type).PointedAtType.ToDisplayString(),
-								IsPointer = true
-							};
-						}
-						else
-						{
-							csParameter.Type = new CsType {Name = parameterSymbol.Type.ToDisplayString()};
-						}
-
-						csMethod.Parameters[j] = csParameter;
-						continue;
-					}
-
-					var parameterTypeArgument = parameter.Type is GenericNameSyntax parameterType ? parameterType.TypeArgumentList.Arguments[0].ToString() : null;
-					csParameter.Type = new CsType
-					{
-						Name = parameterSymbol.Type.Name,
-						TypeParameter = parameterTypeArgument
-					};
-					csMethod.Parameters[j] = csParameter;
-				}
-
-				var intelName = match.Groups["fn"].Value;
-
-				if (!intelMethod2CsMethodMap.ContainsKey(intelName))
-				{
-					intelMethod2CsMethodMap[intelName] = new List<CsMethod>();
-				}
-
-				intelMethod2CsMethodMap[intelName].Add(csMethod);
-			}
-
-			foreach (var (intelMethodName, csMethods) in intelMethod2CsMethodMap)
-			{
-				var intelDataNode = intelData.FirstOrDefault(x => x.Attributes?.GetNamedItem("name")?.Value?.AsSpan().Equals(intelMethodName, StringComparison.InvariantCultureIgnoreCase) ?? false);
-				if (intelDataNode == null)
-				{
-					Debug.WriteLine(intelMethodName);
-					continue;
-				}
-
-				var tech = intelDataNode?.Attributes?.GetNamedItem("tech")?.Value.Replace(".", "");
-				var intelDataNodeReturn = intelDataNode?.SelectSingleNode("return");
-
-				var intelMethod = new IntelMethod
-				{
-					Name = intelDataNode?.Attributes?.GetNamedItem("name")?.Value,
-					Return = new IntelMethodParam
-					{
-						Name = intelDataNodeReturn?.Attributes?.GetNamedItem("varname")?.Value,
-						Type = ParseIntelType(intelDataNodeReturn?.Attributes?.GetNamedItem("type")?.Value, intelDataNodeReturn?.Attributes?.GetNamedItem("etype")?.Value)
-					},
-					Description = intelDataNode?.SelectNodes(@"description")?.Cast<XmlNode>().Select(n => n.InnerText.Replace(Environment.NewLine, "")).FirstOrDefault(),
-					Instructions = intelDataNode?.SelectNodes(@"instruction")?.Cast<XmlNode>().Select(n => $"{n?.Attributes?.GetNamedItem("name")?.Value} {n?.Attributes?.GetNamedItem("form")?.Value}").FirstOrDefault(),
-				};
-
-				var intelMethodParameters = intelDataNode?.SelectNodes(@"parameter")?.Cast<XmlNode>().Select(x => new IntelMethodParam
-				{
-					Name = x.Attributes?.GetNamedItem("varname")?.Value,
-					Type = ParseIntelType(x.Attributes?.GetNamedItem("type")?.Value, x.Attributes?.GetNamedItem("etype")?.Value)
-				}).ToArray();
-				intelMethod.Parameters = intelMethodParameters.Where(x => x.Type.Name != "void" || x.Type.IsPointer).ToArray();
-
-				if (csMethods.Count == 0)
-				{
-					throw new InvalidOperationException($"No method matching Intel's {intelMethodName} found in SR.Intrinsics namespace");
-				}
-
-				var csMethod = FindMostSuited(intelMethod, csMethods);
-				if (!csMethod.ReturnType.IsPointer && csMethod.ReturnType.Name == "bool" && intelMethod.Return.Type.Name == "int")
-				{
-					intelMethod.Return.Type = new IntelType
-					{
-						Name = csMethod.ReturnType.Name,
-						CsType = csMethod.ReturnType,
-						Hint = "UI8"
-					};
-				}
-
-				var mappedParameters = new List<string>();
-				for (var k = 0; k < intelMethod.Parameters.Length; k++)
-				{
-					if (csMethod.Parameters.Length == k) break;
-					var intelMethodParameter = intelMethod.Parameters[k];
-					var csMethodParameter = csMethod.Parameters[k];
-
-					if (IsCsIntrinsicType(csMethodParameter.Type.Name))
-					{
-						mappedParameters.Add($"{intelMethodParameter.Name}.{CsTypeNameToEtype(csMethodParameter.Type.TypeParameter)}");
-						continue;
-					}
-
-					if (intelMethodParameter.Type.Name == csMethodParameter.Type.Name)
-					{
-						mappedParameters.Add($"{intelMethodParameter.Name}");
-						continue;
-					}
-
-					if (csMethodParameter.Type.IsPointer && !intelMethodParameter.Type.IsPointer)
-					{
-						mappedParameters.Add($"({csMethodParameter.Type})&{intelMethodParameter.Name}");
-					}
-					else
-					{
-						mappedParameters.Add($"({csMethodParameter.Type}){intelMethodParameter.Name}");
-					}
-				}
-
-				var codeGenSb = new StringBuilder();
-				var tabOffset = "\t\t";
-				var returnCast = "";
-				if (!IsCsIntrinsicType(csMethod.ReturnType.Name) && csMethod.ReturnType.Name != intelMethod.Return.Type.Name)
-				{
-					returnCast = $"({intelMethod.Return.Type.ToRenderString()})";
-				}
-
-				codeGenSb.AppendLine($"{tabOffset}/// <summary>");
-				codeGenSb.AppendLine($"{tabOffset}/// {intelMethod.Description}");
-				codeGenSb.AppendLine($"{tabOffset}/// </summary>");
-				codeGenSb.AppendLine($"{tabOffset}/// <remarks><c>{intelMethod.Instructions}</c></remarks>");
-				foreach (var intelMethodParameter in intelMethod.Parameters)
-				{
-					codeGenSb.AppendLine($"{tabOffset}/// <param name=\"{intelMethodParameter.Name}\"><c>{intelMethodParameter.Type.Name} {{{intelMethodParameter.Type.Hint}}}</c></param>");
-				}
-
-				codeGenSb.AppendLine($"{tabOffset}/// <returns><c>{intelMethod.Return.Type.Name} {intelMethod.Return.Name} {{{intelMethod.Return.Type.Hint}}}</c></returns>");
-				codeGenSb.AppendLine($"{tabOffset}public static {intelMethod.ToRenderString()} => {returnCast}{csMethod.ClassPath}.{csMethod.Name}({string.Join(", ", mappedParameters)});");
-
-				if (!outputData.ContainsKey(tech))
-				{
-					outputData[tech] = new ConcurrentDictionary<string, string>();
-				}
-				outputData[tech][intelMethodName] = codeGenSb.ToString();
-			}
-		}
-
-		private static async Task<string> FetchFileContent(string url)
-		{
-			var request = new HttpRequestMessage
-			{
-				Method = HttpMethod.Get,
-				RequestUri = new Uri(url),
-			};
-			var client = new HttpClient();
-			var result = await client.SendAsync(request);
-			return await result.Content.ReadAsStringAsync();
-		}
-
-		private static string CsTypeNameToEtype(string cst)
-		{
-			return cst switch
-			{
-				"byte" => "UI8",
-				"sbyte" => "SI8",
-				"ushort" => "UI16",
-				"short" => "SI16",
-				"uint" => "UI32",
-				"int" => "SI32",
-				"ulong" => "UI64",
-				"long" => "SI64",
-				"float" => "FP32",
-				"double" => "FP64",
-				_ => null
-			};
-		}
-
-		private static string EtypeToCsTypeName(string et)
-		{
-			return et switch
-			{
-				"UI8" => "byte",
-				"SI8" => "sbyte",
-				"UI16" => "ushort",
-				"SI16" => "short",
-				"UI32" => "uint",
-				"SI32" => "int",
-				"UI64" => "ulong",
-				"SI64" => "long",
-				"FP32" => "float",
-				"FP64" => "double",
-				_ => null
-			};
-		}
-
-		private static IntelType ParseIntelType(string type, string etype)
-		{
-			var match = IntelTypeDef.Match(type);
-			if (!match.Success)
-			{
-				throw new InvalidOperationException($"Unknown Intel's type {type}");
-			}
-
-			static string IntelTypeNameToSystemTypeName(string itn)
-			{
-				return itn switch
-				{
-					"__int8" or "char" or "__mmask8" => "byte",
-					"__int16" or "__mmask16" => "short",
-					"__int32" or "__mmask32" => "int",
-					"__int64" or "long long" or "__mmask64" => "long",
-					_ => itn
-				};
-			}
-
-			var isUnsigned = match.Groups["is_unsigned"].Success;
-			var isPointer = match.Groups["is_ptr"].Success;
-			var intelTypeName = IntelTypeNameToSystemTypeName(match.Groups["type_name"].Value);
-			var csType = intelTypeName switch
-			{
-				"void" => new CsType
-				{
-					Name = "void",
-					IsPointer = isPointer
-				},
-				"byte" => new CsType
-				{
-					Name = EtypeToCsTypeName(etype) ?? (isUnsigned ? "byte" : "sbyte"),
-					IsPointer = isPointer
-				},
-				"short" => new CsType
-				{
-					Name = EtypeToCsTypeName(etype) ?? (isUnsigned ? "ushort" : "short"),
-					IsPointer = isPointer
-				},
-				"int" => new CsType
-				{
-					Name = EtypeToCsTypeName(etype) ?? (isUnsigned ? "uint" : "int"),
-					IsPointer = isPointer
-				},
-				"long" => new CsType
-				{
-					Name = EtypeToCsTypeName(etype) ?? (isUnsigned ? "ulong" : "long"),
-					IsPointer = isPointer
-				},
-				"float" => new CsType
-				{
-					Name = "float",
-					IsPointer = isPointer
-				},
-				"double" => new CsType
-				{
-					Name = "double",
-					IsPointer = isPointer
-				},
-				"__m64" or "__m64i" or "__m64d" => new CsType
-				{
-					Name = "Vector64",
-					IsPointer = isPointer,
-					TypeParameter = EtypeToCsTypeName(etype)
-				},
-				"__m128" or "__m128i" or "__m128d" => new CsType
-				{
-					Name = "Vector128",
-					IsPointer = isPointer,
-					TypeParameter = EtypeToCsTypeName(etype)
-				},
-				"__m256" or "__m256i" or "__m256d" => new CsType
-				{
-					Name = "Vector256",
-					IsPointer = isPointer,
-					TypeParameter = EtypeToCsTypeName(etype)
-				},
-				_ => throw new InvalidOperationException($"No type matching Intel's {intelTypeName} found")
-			};
-			return new IntelType
-			{
-				Name = intelTypeName,
-				IsPointer = isPointer,
-				Hint = etype,
-				CsType = csType
-			};
-		}
-
-		private static bool IsCsIntrinsicType(string name) => name == nameof(Vector64) || name == nameof(Vector128) || name == nameof(Vector256);
-		
-		private static CsMethod FindMostSuited(IntelMethod intelMethod, List<CsMethod> csMethods)
-		{
-			foreach (var csMethod in csMethods.Where(csMethod => csMethod.Parameters.Length > 0 && intelMethod.Parameters[0].Type.CsType.Name == csMethod.Parameters[0].Type.Name && intelMethod.Parameters[0].Type.CsType.TypeParameter == csMethod.Parameters[0].Type.TypeParameter))
-			{
-				return csMethod;
-			}
-
-			return csMethods[0];
-		}
-
-		private struct CsType
-		{
-			public string Name;
-			public string TypeParameter;
-			public bool IsPointer;
-
-			public override string ToString()
-			{
-				var name = TypeParameter == null ? Name : $"{Name}<{TypeParameter}>";
-				return IsPointer ? $"{name}*" : $"{name}";
-			}
-		}
-
-		private struct CsMethod
-		{
-			public string ClassPath;
-			public string Name;
-			public CsType ReturnType;
-			public CsMethodParam[] Parameters;
-			public override string ToString() => $"{ReturnType} {Name}({string.Join(", ", Parameters)})";
-		}
-
-		private struct CsMethodParam
-		{
-			public string Name;
-			public CsType Type;
-			public override string ToString() => $"{Type} {Name}";
-		}
-
-		private struct IntelType
-		{
-			public string Name;
-			public string Hint;
-			public bool IsPointer;
-			public CsType CsType;
-			public string ToRenderString() => IsPointer ? $"{Name}*" : $"{Name}";
-			public override string ToString() => IsPointer ? $"{Name}* /* {Hint} */" : $"{Name} /* {Hint} */";
-		}
-
-		private struct IntelMethod
-		{
-			public string Name;
-			public IntelMethodParam Return;
-			public IntelMethodParam[] Parameters;
-			public string Description;
-			public string Instructions;
-			public string ToRenderString() => $"{Return.Type.ToRenderString()} {Name}({string.Join(", ", Parameters.Select(x => x.ToRenderString()))})";
-			public override string ToString() => $"{Return.Type} {Name}({string.Join(", ", Parameters)})";
-		}
-
-		private struct IntelMethodParam
-		{
-			public string Name;
-			public IntelType Type;
-			public string ToRenderString() => $"{Type.ToRenderString()} {Name}";
-			public override string ToString() => $"{Type} {Name}";
-		}
-	}
-}
\ No newline at end of file
diff --git a/src/External/RawIntrinsicsGenerator/Program.cs b/src/External/RawIntrinsicsGenerator/Program.cs
deleted file mode 100644
index 735c982..0000000
--- a/src/External/RawIntrinsicsGenerator/Program.cs
+++ /dev/null
@@ -1,16 +0,0 @@
-using System.Reflection;
-
-namespace RawIntrinsicsGenerator
-{
-    public static class Program
-	{
-		private async static Task Main(string[] _)
-		{
-			var savePath = Path.Combine(Path.GetDirectoryName(Assembly.GetExecutingAssembly().Location), "RawIntrinsics");
-			
-			await Generator.Generate("RawIntrinsics", savePath);
-			
-			Console.WriteLine($"Done! Generated files were saved to {savePath}");
-		}
-	}
-}
\ No newline at end of file
diff --git a/src/External/RawIntrinsicsGenerator/RawIntrinsicsGenerator.csproj b/src/External/RawIntrinsicsGenerator/RawIntrinsicsGenerator.csproj
deleted file mode 100644
index 3fb0ffa..0000000
--- a/src/External/RawIntrinsicsGenerator/RawIntrinsicsGenerator.csproj
+++ /dev/null
@@ -1,16 +0,0 @@
-<Project Sdk="Microsoft.NET.Sdk">
-
-    <PropertyGroup>
-        <TargetFramework>net7.0</TargetFramework>
-        <OutputType>Exe</OutputType>
-    </PropertyGroup>
-
-    <ItemGroup>
-        <PackageReference Include="Microsoft.CodeAnalysis.CSharp" Version="4.0.1" PrivateAssets="all" />
-    </ItemGroup>
-
-    <ItemGroup>
-        <ProjectReference Include="..\RawIntrinsics\RawIntrinsics.csproj" />
-    </ItemGroup>
-
-</Project>
diff --git a/src/Fast.PRNGs/Common.cs b/src/Fast.PRNGs/Common.cs
index d6c56c7..c501dc6 100644
--- a/src/Fast.PRNGs/Common.cs
+++ b/src/Fast.PRNGs/Common.cs
@@ -1,13 +1,41 @@
 using System.Runtime.CompilerServices;
+using System.Runtime.Intrinsics;
+using System.Runtime.Intrinsics.X86;
 
 namespace Fast.PRNGs;
 
 internal static class Common
 {
-    internal const ulong DoubleMask = (1L << 53) - 1;
-    internal const double Norm53 = 1.0d / (1L << 53);
-    internal const ulong FloatMask = (1L << 24) - 1;
-    internal const float Norm24 = 1.0f / (1L << 24);
+    // From http://prng.di.unimi.it/ - keeps the top 53 bits of value and scales them by 2^-53, giving a double in [0, 1).
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    internal static double ExtractDouble(ulong value) =>
+        (value >> 11) * (1.0 / (1ul << 53));
+
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    internal static float ExtractSingle(ulong value) => // top 24 bits of value scaled by 2^-24, giving a float in [0, 1)
+        (value >> 40) * (1.0f / (1u << 24));
+
+    private static readonly Vector256<double> DoubleMultiplier256 = Vector256.Create(1.0 / (1ul << 53));
+    private static readonly Vector256<float> SingleMultiplier256 = Vector256.Create(1.0f / (1u << 24));
+    private static readonly Vector512<double> DoubleMultiplier512 = Vector512.Create(1.0 / (1ul << 53));
+    private static readonly Vector512<float> SingleMultiplier512 = Vector512.Create(1.0f / (1u << 24));
+
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    internal static void ExtractDoubles256(in Vector256<ulong> values, ref Vector256<double> result) => // per 64-bit lane: (lane >> 11) converted to double and scaled by 2^-53; 4 doubles written to result
+        result = Avx2.Multiply(Vector256.ConvertToDouble(Avx2.ShiftRightLogical(values, 11)), DoubleMultiplier256);
+
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    internal static void ExtractSingles256(in Vector256<ulong> values, ref Vector256<float> result) => // 8 floats in [0, 1): top 24 bits of every 32-bit lane, scaled by 2^-24
+        result = Avx2.Multiply(Vector256.ConvertToSingle(Avx2.ShiftRightLogical(values.AsUInt32(), 8).AsInt32()), SingleMultiplier256); // shift per 32-bit lane: a 64-bit shift by 40 left every odd float lane at 0.0f
+
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    internal static void ExtractDoubles512(in Vector512<ulong> values, ref Vector512<double> result) => // per 64-bit lane: (lane >> 11) converted to double and scaled by 2^-53; 8 doubles written to result
+        result = Avx512F.Multiply(Vector512.ConvertToDouble(Avx512F.ShiftRightLogical(values, 11)), DoubleMultiplier512);
+
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    internal static void ExtractSingles512(in Vector512<ulong> values, ref Vector512<float> result) => // 16 floats in [0, 1): top 24 bits of every 32-bit lane, scaled by 2^-24
+        result = Avx512F.Multiply(Vector512.ConvertToSingle(Avx512F.ShiftRightLogical(values.AsUInt32(), 8).AsInt32()), SingleMultiplier512); // shift per 32-bit lane: a 64-bit shift by 40 left every odd float lane at 0.0f
+
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
     internal static ulong Rotl(ulong x, int k)
diff --git a/src/Fast.PRNGs/Fast.PRNGs.csproj b/src/Fast.PRNGs/Fast.PRNGs.csproj
index dfd20ad..cb8e770 100644
--- a/src/Fast.PRNGs/Fast.PRNGs.csproj
+++ b/src/Fast.PRNGs/Fast.PRNGs.csproj
@@ -1,7 +1,7 @@
 <Project Sdk="Microsoft.NET.Sdk">
 
     <PropertyGroup>
-        <TargetFramework>net7.0</TargetFramework>
+        <TargetFramework>net8.0</TargetFramework>
         <AllowUnsafeBlocks>true</AllowUnsafeBlocks>
         <IsPackable>true</IsPackable>
 
@@ -32,8 +32,8 @@
         <PackageReference Include="InlineIL.Fody" Version="1.7.4" PrivateAssets="all" />
     </ItemGroup>
 
-    <ItemGroup>
+    <!--<ItemGroup>
         <Compile Include="..\External\RawIntrinsics\*.cs" />
-    </ItemGroup>
+    </ItemGroup>-->
 
 </Project>
diff --git a/src/Fast.PRNGs/MWC256.cs b/src/Fast.PRNGs/MWC256.cs
index adfa6cf..3b46235 100644
--- a/src/Fast.PRNGs/MWC256.cs
+++ b/src/Fast.PRNGs/MWC256.cs
@@ -76,14 +76,8 @@ public int Next()
     }
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
-    public double NextDouble()
-    {
-        return (NextInternal() & DoubleMask) * Norm53;
-    }
+    public double NextDouble() => ExtractDouble(NextInternal());
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
-    public float NextFloat()
-    {
-        return (NextInternal() & FloatMask) * Norm24;
-    }
+    public float NextFloat() => ExtractSingle(NextInternal());
 }
diff --git a/src/Fast.PRNGs/Shishua.cs b/src/Fast.PRNGs/Shishua.cs
index f2e71fd..343a270 100644
--- a/src/Fast.PRNGs/Shishua.cs
+++ b/src/Fast.PRNGs/Shishua.cs
@@ -1,12 +1,9 @@
 using System.Diagnostics;
 using System.Runtime.CompilerServices;
 using System.Runtime.InteropServices;
+using System.Runtime.Intrinsics;
 using System.Runtime.Intrinsics.X86;
-using RawIntrinsics;
-
 using static Fast.PRNGs.Common;
-using static RawIntrinsics.AVX;
-using static RawIntrinsics.AVX2;
 
 namespace Fast.PRNGs;
 
@@ -26,7 +23,7 @@ namespace Fast.PRNGs;
         0x626E33B8D04B4331, 0xBBF73C790D94F79D, 0x471C4AB3ED3D82A5, 0xFEC507705E4AE6E5,
     };
 
-    private const int BufferSize = 1 << 17;
+    private const int BufferSize = 1 << 18;
 
     private readonly nuint _state;
 
@@ -101,23 +98,61 @@ private ulong NextInternal()
     }
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
-    public int Next()
+    private ref Vector256<ulong> NextInternalVec256()
     {
-        return (int)(NextInternal() >> 32);
+        const int size = sizeof(ulong) * 4;
+
+        ref var bufferedState = ref this.State;
+        if (bufferedState.BufferIndex >= BufferSize || BufferSize - bufferedState.BufferIndex < size)
+        {
+            FillBuffer(ref bufferedState);
+        }
+
+        ref var value = ref Unsafe.As<byte, Vector256<ulong>>(ref bufferedState.Buffer[bufferedState.BufferIndex]);
+        bufferedState.BufferIndex += size;
+        return ref value;
     }
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
-    public double NextDouble()
+    private ref Vector512<ulong> NextInternalVec512()
     {
-        return (NextInternal() & DoubleMask) * Norm53;
+        const int size = sizeof(ulong) * 8;
+
+        ref var bufferedState = ref this.State;
+        if (bufferedState.BufferIndex >= BufferSize || BufferSize - bufferedState.BufferIndex < size)
+        {
+            FillBuffer(ref bufferedState);
+        }
+
+        ref var value = ref Unsafe.As<byte, Vector512<ulong>>(ref bufferedState.Buffer[bufferedState.BufferIndex]);
+        bufferedState.BufferIndex += size;
+        return ref value;
     }
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
-    public float NextFloat()
+    public int Next()
     {
-        return (NextInternal() & FloatMask) * Norm24;
+        return (int)(NextInternal() >> 32);
     }
 
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    public double NextDouble() => ExtractDouble(NextInternal());
+
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    public void NextDoubles256(ref Vector256<double> result) => ExtractDoubles256(NextInternalVec256(), ref result);
+
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    public void NextDoubles512(ref Vector512<double> result) => ExtractDoubles512(NextInternalVec512(), ref result);
+
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    public float NextFloat() => ExtractSingle(NextInternal());
+
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    public void NextFloats256(ref Vector256<float> result) => ExtractSingles256(NextInternalVec256(), ref result);
+
+    [MethodImpl(MethodImplOptions.AggressiveInlining)]
+    public void NextFloats512(ref Vector512<float> result) => ExtractSingles512(NextInternalVec512(), ref result);
+
     public void Dispose()
     {
         FreeState();
@@ -142,10 +177,10 @@ private void InitState(ref RawState state, ref Seed seed)
 
         Span<byte> buf = stackalloc byte[128 * steps];
 
-        state.State[0] = _mm256_setr_epi64x((long)(Phi[0] ^ seed[0]), (long)(Phi[1]), (long)(Phi[2] ^ seed[1]), (long)(Phi[3]));
-        state.State[1] = _mm256_setr_epi64x((long)(Phi[4] ^ seed[2]), (long)(Phi[5]), (long)(Phi[6] ^ seed[3]), (long)(Phi[7]));
-        state.State[2] = _mm256_setr_epi64x((long)(Phi[8] ^ seed[2]), (long)(Phi[9]), (long)(Phi[10] ^ seed[3]), (long)(Phi[11]));
-        state.State[3] = _mm256_setr_epi64x((long)(Phi[12] ^ seed[0]), (long)(Phi[13]), (long)(Phi[14] ^ seed[1]), (long)(Phi[15]));
+        state.State[0] = Vector256.Create((ulong)(Phi[0] ^ seed[0]), (ulong)(Phi[1]), (ulong)(Phi[2] ^ seed[1]), (ulong)(Phi[3]));
+        state.State[1] = Vector256.Create((ulong)(Phi[4] ^ seed[2]), (ulong)(Phi[5]), (ulong)(Phi[6] ^ seed[3]), (ulong)(Phi[7]));
+        state.State[2] = Vector256.Create((ulong)(Phi[8] ^ seed[2]), (ulong)(Phi[9]), (ulong)(Phi[10] ^ seed[3]), (ulong)(Phi[11]));
+        state.State[3] = Vector256.Create((ulong)(Phi[12] ^ seed[0]), (ulong)(Phi[13]), (ulong)(Phi[14] ^ seed[1]), (ulong)(Phi[15]));
 
         for (int i = 0; i < rounds; i++)
         {
@@ -155,6 +190,7 @@ private void InitState(ref RawState state, ref Seed seed)
         }
     }
 
+    [MethodImpl(MethodImplOptions.NoInlining)]
     private void FillBuffer(ref BufferedState bufferedState)
     {
         PrngGen(ref bufferedState.State, bufferedState.Buffer);
@@ -165,17 +201,17 @@ unsafe private void PrngGen(ref RawState state, Span<byte> buffer)
     {
         var size = buffer.Length;
 
-        __m256i
+        Vector256<ulong>
             o0 = state.Output[0], o1 = state.Output[1],
             o2 = state.Output[2], o3 = state.Output[3],
             s0 = state.State[0], s1 = state.State[1],
             s2 = state.State[2], s3 = state.State[3],
             t0, t1, t2, t3, u0, u1, u2, u3, counter = state.Counter;
 
-        __m256i shu0 = _mm256_setr_epi32(5, 6, 7, 0, 1, 2, 3, 4),
-                shu1 = _mm256_setr_epi32(3, 4, 5, 6, 7, 0, 1 ,2);
+        Vector256<uint> shu0 = Vector256.Create(5u, 6u, 7u, 0u, 1u, 2u, 3u, 4u),
+                shu1 = Vector256.Create(3u, 4u, 5u, 6u, 7u, 0u, 1u, 2u);
 
-        __m256i increment = _mm256_setr_epi64x(7, 5, 3, 1);
+        Vector256<ulong> increment = Vector256.Create(7UL, 5UL, 3UL, 1UL);
 
         Debug.Assert(size % 128 == 0, "buf's size must be a multiple of 128 bytes");
 
@@ -183,28 +219,28 @@ unsafe private void PrngGen(ref RawState state, Span<byte> buffer)
         {
             if (!buffer.IsEmpty)
             {
-                _mm256_storeu_si256((__m256i*)Unsafe.AsPointer(ref buffer[i + 0]), o0);
-                _mm256_storeu_si256((__m256i*)Unsafe.AsPointer(ref buffer[i + 32]), o1);
-                _mm256_storeu_si256((__m256i*)Unsafe.AsPointer(ref buffer[i + 64]), o2);
-                _mm256_storeu_si256((__m256i*)Unsafe.AsPointer(ref buffer[i + 96]), o3);
+                Avx.Store((ulong*)Unsafe.AsPointer(ref buffer[i + 0]), o0);  // each 128-byte block is o0 | o1 | o2 | o3, 32 bytes apiece
+                Avx.Store((ulong*)Unsafe.AsPointer(ref buffer[i + 32]), o1); // was o0: the second output vector was never emitted
+                Avx.Store((ulong*)Unsafe.AsPointer(ref buffer[i + 64]), o2); // was o0
+                Avx.Store((ulong*)Unsafe.AsPointer(ref buffer[i + 96]), o3); // was o0
             }
 
-            s1 = _mm256_add_epi64(s1, counter);
-            s3 = _mm256_add_epi64(s3, counter);
-            counter = _mm256_add_epi64(counter, increment);
+            s1 = Avx2.Add(s1, counter);
+            s3 = Avx2.Add(s3, counter);
+            counter = Avx2.Add(counter, increment);
 
-            u0 = _mm256_srli_epi64(s0, 1); u1 = _mm256_srli_epi64(s1, 3);
-            u2 = _mm256_srli_epi64(s2, 1); u3 = _mm256_srli_epi64(s3, 3);
-            t0 = _mm256_permutevar8x32_epi32(s0, shu0); t1 = _mm256_permutevar8x32_epi32(s1, shu1);
-            t2 = _mm256_permutevar8x32_epi32(s2, shu0); t3 = _mm256_permutevar8x32_epi32(s3, shu1);
+            u0 = Avx2.ShiftRightLogical(s0, 1); u1 = Avx2.ShiftRightLogical(s1, 3);
+            u2 = Avx2.ShiftRightLogical(s2, 1); u3 = Avx2.ShiftRightLogical(s3, 3);
+            t0 = Avx2.PermuteVar8x32(s0.AsUInt32(), shu0).AsUInt64(); t1 = Avx2.PermuteVar8x32(s1.AsUInt32(), shu1).AsUInt64();
+            t2 = Avx2.PermuteVar8x32(s2.AsUInt32(), shu0).AsUInt64(); t3 = Avx2.PermuteVar8x32(s3.AsUInt32(), shu1).AsUInt64();
 
-            s0 = _mm256_add_epi64(t0, u0); s1 = _mm256_add_epi64(t1, u1);
-            s2 = _mm256_add_epi64(t2, u2); s3 = _mm256_add_epi64(t3, u3);
+            s0 = Avx2.Add(t0, u0); s1 = Avx2.Add(t1, u1);
+            s2 = Avx2.Add(t2, u2); s3 = Avx2.Add(t3, u3);
 
-            o0 = _mm256_xor_si256(u0, t1);
-            o1 = _mm256_xor_si256(u2, t3);
-            o2 = _mm256_xor_si256(s0, s3);
-            o3 = _mm256_xor_si256(s2, s1);
+            o0 = Avx2.Xor(u0, t1);
+            o1 = Avx2.Xor(u2, t3);
+            o2 = Avx2.Xor(s0, s3);
+            o3 = Avx2.Xor(s2, s1);
         }
 
         state.Output[0] = o0; state.Output[1] = o1; state.Output[2] = o2; state.Output[3] = o3;
@@ -230,20 +266,20 @@ unsafe private struct BufferedState
     [StructLayout(LayoutKind.Sequential)]
     private struct RawState
     {
-        private __m256i _state00;
-        private __m256i _state01;
-        private __m256i _state02;
-        private __m256i _state03;
-        public Span<__m256i> State => MemoryMarshal.CreateSpan(ref _state00, 4);
+        private Vector256<ulong> _state00;
+        private Vector256<ulong> _state01;
+        private Vector256<ulong> _state02;
+        private Vector256<ulong> _state03;
+        public Span<Vector256<ulong>> State => MemoryMarshal.CreateSpan(ref _state00, 4);
 
 
-        private __m256i _output00;
-        private __m256i _output01;
-        private __m256i _output02;
-        private __m256i _output03;
-        public Span<__m256i> Output => MemoryMarshal.CreateSpan(ref _output00, 4);
+        private Vector256<ulong> _output00;
+        private Vector256<ulong> _output01;
+        private Vector256<ulong> _output02;
+        private Vector256<ulong> _output03;
+        public Span<Vector256<ulong>> Output => MemoryMarshal.CreateSpan(ref _output00, 4);
 
-        public __m256i Counter;
+        public Vector256<ulong> Counter;
     }
 
     [StructLayout(LayoutKind.Sequential)]
diff --git a/src/Fast.PRNGs/Splitmix64.cs b/src/Fast.PRNGs/Splitmix64.cs
index 73c8fba..a30c50b 100644
--- a/src/Fast.PRNGs/Splitmix64.cs
+++ b/src/Fast.PRNGs/Splitmix64.cs
@@ -28,14 +28,8 @@ public ulong Next()
     }
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
-    public double NextDouble()
-    {
-        return (Next() & DoubleMask) * Norm53;
-    }
+    public double NextDouble() => ExtractDouble(Next());
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
-    public float NextFloat()
-    {
-        return (Next() & FloatMask) * Norm24;
-    }
+    public float NextFloat() => ExtractSingle(Next());
 }
diff --git a/src/Fast.PRNGs/Xoroshiro128Plus.cs b/src/Fast.PRNGs/Xoroshiro128Plus.cs
index 2537628..b957cf3 100644
--- a/src/Fast.PRNGs/Xoroshiro128Plus.cs
+++ b/src/Fast.PRNGs/Xoroshiro128Plus.cs
@@ -1,4 +1,3 @@
-using System;
 using System.Runtime.CompilerServices;
 using System.Runtime.InteropServices;
 using static Fast.PRNGs.Common;
@@ -50,14 +49,8 @@ public int Next()
     }
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
-    public double NextDouble()
-    {
-        return (NextInternal() & DoubleMask) * Norm53;
-    }
+    public double NextDouble() => ExtractDouble(NextInternal());
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
-    public float NextFloat()
-    {
-        return (NextInternal() & FloatMask) * Norm24;
-    }
+    public float NextFloat() => ExtractSingle(NextInternal());
 }
diff --git a/src/Fast.PRNGs/Xoshiro256Plus.cs b/src/Fast.PRNGs/Xoshiro256Plus.cs
index ebe390e..c508a5e 100644
--- a/src/Fast.PRNGs/Xoshiro256Plus.cs
+++ b/src/Fast.PRNGs/Xoshiro256Plus.cs
@@ -80,14 +80,8 @@ public int Next()
     }
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
-    public double NextDouble()
-    {
-        return (NextInternal() & DoubleMask) * Norm53;
-    }
+    public double NextDouble() => ExtractDouble(NextInternal());
 
     [MethodImpl(MethodImplOptions.AggressiveInlining)]
-    public float NextFloat()
-    {
-        return (NextInternal() & FloatMask) * Norm24;
-    }
+    public float NextFloat() => ExtractSingle(NextInternal());
 }
diff --git a/test/Fast.PRNGs.Tests/Fast.PRNGs.Tests.csproj b/test/Fast.PRNGs.Tests/Fast.PRNGs.Tests.csproj
index dc3bd16..a35bfaa 100644
--- a/test/Fast.PRNGs.Tests/Fast.PRNGs.Tests.csproj
+++ b/test/Fast.PRNGs.Tests/Fast.PRNGs.Tests.csproj
@@ -1,7 +1,7 @@
 <Project Sdk="Microsoft.NET.Sdk">
 
     <PropertyGroup>
-        <TargetFramework>net7.0</TargetFramework>
+        <TargetFramework>net8.0</TargetFramework>
     </PropertyGroup>
 
     <ItemGroup>
diff --git a/test/Fast.PRNGs.Tests/ShishuaTests.cs b/test/Fast.PRNGs.Tests/ShishuaTests.cs
index 6e7d552..a921bcb 100644
--- a/test/Fast.PRNGs.Tests/ShishuaTests.cs
+++ b/test/Fast.PRNGs.Tests/ShishuaTests.cs
@@ -1,7 +1,8 @@
-﻿using Accord.Statistics.Distributions.Univariate;
+using Accord.Statistics.Distributions.Univariate;
 using Accord.Statistics.Testing;
 using Plotly.NET.CSharp;
 using System.Runtime.CompilerServices;
+using System.Runtime.Intrinsics;
 
 namespace Fast.PRNGs.Tests;
 
@@ -68,6 +69,24 @@ public void InitFromNew()
         using var _ = Shishua.Create(new Random());
     }
 
+    public void Compare()
+    {
+        if (!Shishua.IsSupported)
+            return;
+        // Checks that the scalar and the 256-bit vector APIs agree on the first value for generators created from the same Random(0).
+        using var rng1 = Shishua.Create(new Random(0));
+        using var rng2 = Shishua.Create(new Random(0));
+        using var rng3 = Shishua.Create(new Random(0));
+
+        Vector256<double> vec256 = default;
+
+        var val1 = rng1.NextDouble();
+        rng2.NextDoubles256(ref vec256);
+        // TODO: rng3 is created for a 512-bit comparison that is not exercised yet (NextDoubles512 fills a ref Vector512<double>).
+        Assert.True(Math.Abs(vec256[0] - val1) < 0.0001d);
+        // TODO: assert lane 0 of the NextDoubles512 result against val1 with the same tolerance.
+    }
+
     public void InitFromBytes()
     {
         if (!Shishua.IsSupported)