source code
/* The Computer Language Benchmarks Game
https://salsa.debian.org/benchmarksgame-team/benchmarksgame/
contributed by Jesper Meyer
*/
using System;
using System.Runtime.CompilerServices;
using System.Runtime.Intrinsics;
using System.Runtime.Intrinsics.X86;
using System.Threading.Tasks;
namespace SpectralNorm
{
/// <summary>
/// Spectral-norm benchmark: runs ten rounds of power iteration with the
/// matrix whose entries are <c>1 / A(i, j)</c> and prints
/// <c>sqrt((u . v) / (v . v))</c> with nine decimal places.
/// </summary>
unsafe class Program
{
    /// <summary>
    /// Entry point. The optional first argument is the vector length
    /// <c>n</c> (default 100).
    /// </summary>
    /// <param name="args">Command-line arguments; <c>args[0]</c>, if present, is parsed as <c>n</c>.</param>
    public static void Main(string[] args)
    {
        int n = 100;
        if (args.Length > 0)
        {
            n = int.Parse(args[0], System.Globalization.CultureInfo.InvariantCulture);
        }

        fixed (double* u = new double[n])
        fixed (double* v = new double[n])
        {
            // Start from the all-ones vector; v is fully overwritten by the first multiplication.
            new Span<double>(u, n).Fill(1);
            for (var i = 0; i < 10; i++)
            {
                mult_AtAv(u, v, n);
                mult_AtAv(v, u, n);
            }

            var result = Math.Sqrt(dot(u, v, n) / dot(v, v, n));

            // Format with the invariant culture so the decimal separator is always '.',
            // independent of the machine's regional settings.
            Console.WriteLine(result.ToString("f9", System.Globalization.CultureInfo.InvariantCulture));
        }
    }

    /// <summary>
    /// Returns the denominator of matrix entry (i, j); the matrix element
    /// used by the multiplications is <c>1 / A(i, j)</c>.
    /// </summary>
    /// <param name="i">Zero-based row index.</param>
    /// <param name="j">Zero-based column index.</param>
    /// <returns><c>(i + j) * (i + j + 1) / 2 + i + 1</c> as a double.</returns>
    [MethodImpl(MethodImplOptions.AggressiveInlining)]
    private static double A(int i, int j)
    {
        // Computed in 64-bit: the product (i + j) * (i + j + 1) exceeds
        // int.MaxValue once i + j reaches 46341. The division by 2 is exact
        // because one of two consecutive integers is always even.
        long s = (long)i + j;
        return s * (s + 1) / 2 + i + 1;
    }

    /// <summary>Returns the dot product of the first <paramref name="n"/> elements of two vectors.</summary>
    /// <param name="v">First vector; must have at least <paramref name="n"/> readable elements.</param>
    /// <param name="u">Second vector; must have at least <paramref name="n"/> readable elements.</param>
    /// <param name="n">Number of elements to multiply and accumulate.</param>
    private static double dot(double* v, double* u, int n)
    {
        double sum = 0;
        for (var i = 0; i < n; i++)
        {
            sum += v[i] * u[i];
        }

        return sum;
    }

    /// <summary>
    /// Computes <c>outv[i] = sum over j of v[j] / A(i, j)</c> for every
    /// <c>i</c> in <c>[0, n)</c>, distributing rows with <see cref="Parallel.For(int, int, Action{int})"/>.
    /// </summary>
    /// <param name="v">Input vector of length <paramref name="n"/>.</param>
    /// <param name="outv">Output vector of length <paramref name="n"/>; each row writes only its own element.</param>
    /// <param name="n">Vector length; may be odd.</param>
    [MethodImpl(MethodImplOptions.AggressiveOptimization)]
    private static void mult_Av(double* v, double* outv, int n)
    {
        // Only the even-length prefix is processed two lanes at a time, so the
        // 128-bit load never reads past element n - 1 when n is odd.
        int pairedEnd = n & ~1;
        Parallel.For(0, n, i =>
        {
            var sum = Vector128<double>.Zero;
            for (var j = 0; j < pairedEnd; j += 2)
            {
                var b = Vector128.Load(v + j);
                var a = Vector128.Create(A(i, j), A(i, j + 1));
                sum += b / a;
            }

            // Lane 0 + lane 1, then the leftover last element for odd n.
            var value = Vector128.Sum(sum);
            if (pairedEnd < n)
            {
                value += v[pairedEnd] / A(i, pairedEnd);
            }

            outv[i] = value;
        });
    }

    /// <summary>
    /// Computes <c>outv[i] = sum over j of v[j] / A(j, i)</c> for every
    /// <c>i</c> in <c>[0, n)</c> (the transposed counterpart of
    /// <see cref="mult_Av"/>), distributing rows with <see cref="Parallel.For(int, int, Action{int})"/>.
    /// </summary>
    /// <param name="v">Input vector of length <paramref name="n"/>.</param>
    /// <param name="outv">Output vector of length <paramref name="n"/>; each row writes only its own element.</param>
    /// <param name="n">Vector length; may be odd.</param>
    [MethodImpl(MethodImplOptions.AggressiveOptimization)]
    private static void mult_Atv(double* v, double* outv, int n)
    {
        // Only the even-length prefix is processed two lanes at a time, so the
        // 128-bit load never reads past element n - 1 when n is odd.
        int pairedEnd = n & ~1;
        Parallel.For(0, n, i =>
        {
            var sum = Vector128<double>.Zero;
            for (var j = 0; j < pairedEnd; j += 2)
            {
                var b = Vector128.Load(v + j);
                var a = Vector128.Create(A(j, i), A(j + 1, i));
                sum += b / a;
            }

            // Lane 0 + lane 1, then the leftover last element for odd n.
            var value = Vector128.Sum(sum);
            if (pairedEnd < n)
            {
                value += v[pairedEnd] / A(pairedEnd, i);
            }

            outv[i] = value;
        });
    }

    /// <summary>
    /// Applies <see cref="mult_Av"/> followed by <see cref="mult_Atv"/>,
    /// using a freshly allocated temporary vector for the intermediate result.
    /// </summary>
    /// <param name="v">Input vector of length <paramref name="n"/>.</param>
    /// <param name="outv">Output vector of length <paramref name="n"/>.</param>
    /// <param name="n">Vector length.</param>
    private static void mult_AtAv(double* v, double* outv, int n)
    {
        fixed (double* tmp = new double[n])
        {
            mult_Av(v, tmp, n);
            mult_Atv(tmp, outv, n);
        }
    }
}
}
notes, command-line, and program output
NOTES:
64-bit Ubuntu quad core
.NET SDK 9.0.100
Host Version: 9.0.0
Commit: 9d5a6a9aa4
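<OutputType>Exe</OutputType>
<TargetFramework>net9.0</TargetFramework>
<ImplicitUsings>enable</ImplicitUsings>
<Nullable>enable</Nullable>
<AllowUnsafeBlocks>true</AllowUnsafeBlocks>
<ServerGarbageCollection>true</ServerGarbageCollection>
<ConcurrentGarbageCollection>true</ConcurrentGarbageCollection>
<PublishAot>true</PublishAot>
<OptimizationPreference>Speed</OptimizationPreference>
<IlcInstructionSet>native</IlcInstructionSet>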
Thu, 14 Nov 2024 01:31:40 GMT
MAKE:
cp spectralnorm.csharpaot-5.csharpaot Program.cs
cp Include/csharpaot/program.csproj .
mkdir obj
cp Include/csharpaot/project.assets.json ./obj
/opt/src/dotnet-sdk-9.0.100/dotnet publish
Determining projects to restore...
Restored /home/dunham/all-benchmarksgame/benchmarksgame_i53330/spectralnorm/tmp/program.csproj (in 943 ms).
program -> /home/dunham/all-benchmarksgame/benchmarksgame_i53330/spectralnorm/tmp/bin/Release/net9.0/linux-x64/program.dll
Generating native code
program -> /home/dunham/all-benchmarksgame/benchmarksgame_i53330/spectralnorm/tmp/bin/Release/net9.0/linux-x64/publish/
25.31s to complete and log all make actions
COMMAND LINE:
./bin/Release/net9.0/linux-x64/native/program 5500
PROGRAM OUTPUT:
1.274224153