Files
Misaki.HighPerformance/Misaki.HighPerformance.Mathematics.SPMD/IJobSPMD.cs
2026-02-21 17:20:51 +09:00

145 lines
5.0 KiB
C#

using Misaki.HighPerformance.Jobs;
using System.Numerics;
namespace Misaki.HighPerformance.Mathematics.SPMD;
public interface IJobSPMD<TNumber>
where TNumber : unmanaged, INumber<TNumber>, IBinaryNumber<TNumber>, IMinMaxValue<TNumber>, IBitwiseOperators<TNumber, TNumber, TNumber>
{
void Execute<TLane>(int baseIndex, int threadIndex)
where TLane : ISPMD<TLane, TNumber>;
}
internal struct SPMDJobWrapper<T, TNumber> : IJobParallelFor
where T : unmanaged, IJobSPMD<TNumber>
where TNumber : unmanaged, INumber<TNumber>, IBinaryNumber<TNumber>, IMinMaxValue<TNumber>, IBitwiseOperators<TNumber, TNumber, TNumber>
{
public T innerJob;
public int totalCount;
public void Execute(int loopIndex, int threadIndex)
{
var baseIndex = loopIndex * WideLane<TNumber>.LaneWidth;
var remaining = totalCount - baseIndex;
if (remaining >= WideLane<TNumber>.LaneWidth)
{
innerJob.Execute<WideLane<TNumber>>(baseIndex, threadIndex);
}
else
{
for (var j = 0; j < remaining; j++)
{
innerJob.Execute<ScalarLane<TNumber>>(baseIndex + j, threadIndex);
}
}
}
//public void Execute(int startIndex, int endIndex, int threadIndex)
//{
// for (int i = startIndex; i < endIndex; i++)
// {
// var baseIndex = i * WideLane<TNumber>.LaneWidth;
// var remaining = totalCount - baseIndex;
// if (remaining >= WideLane<TNumber>.LaneWidth)
// {
// innerJob.Execute<WideLane<TNumber>>(baseIndex, threadIndex);
// }
// else
// {
// for (var j = 0; j < remaining; j++)
// {
// innerJob.Execute<ScalarLane<TNumber>>(baseIndex + j, threadIndex);
// }
// }
// }
//}
}
internal struct SPMDScalerJobWrapper<T, TNumber> : IJobParallelFor
where T : unmanaged, IJobSPMD<TNumber>
where TNumber : unmanaged, INumber<TNumber>, IBinaryNumber<TNumber>, IMinMaxValue<TNumber>, IBitwiseOperators<TNumber, TNumber, TNumber>
{
public T innerJob;
public int totalCount;
public void Execute(int loopIndex, int threadIndex)
{
innerJob.Execute<ScalarLane<TNumber>>(loopIndex, threadIndex);
}
//[MethodImpl(MethodImplOptions.AggressiveInlining)]
//public void Execute(int startIndex, int endIndex, int threadIndex)
//{
// for (int i = startIndex; i < endIndex; i++)
// {
// innerJob.Execute<ScalarLane<TNumber>>(i, threadIndex);
// }
//}
}
public static class IJobParallelForSPMDExtensions
{
public static void Run<T, TNumber>(this ref T job, int totalCount, int threadIndex)
where T : struct, IJobSPMD<TNumber>
where TNumber : unmanaged, INumber<TNumber>, IBinaryNumber<TNumber>, IMinMaxValue<TNumber>, IBitwiseOperators<TNumber, TNumber, TNumber>
{
if (WideLane.IsSupported)
{
var iterations = (totalCount + WideLane<TNumber>.LaneWidth - 1) / WideLane<TNumber>.LaneWidth;
for (var loopIndex = 0; loopIndex < iterations; loopIndex++)
{
var baseIndex = loopIndex * WideLane<TNumber>.LaneWidth;
var remaining = totalCount - baseIndex;
if (remaining >= WideLane<TNumber>.LaneWidth)
{
job.Execute<WideLane<TNumber>>(baseIndex, threadIndex);
}
else
{
for (var i = 0; i < remaining; i++)
{
job.Execute<ScalarLane<TNumber>>(baseIndex + i, threadIndex);
}
}
}
}
else
{
for (var loopIndex = 0; loopIndex < totalCount; loopIndex++)
{
job.Execute<ScalarLane<TNumber>>(loopIndex, threadIndex);
}
}
}
public static JobHandle ScheduleParallelSPDM<T, TNumber>(this JobScheduler jobScheduler, ref T job, int totalCount, int batchSize, int threadIndex, JobHandle dependency)
where T : unmanaged, IJobSPMD<TNumber>
where TNumber : unmanaged, INumber<TNumber>, IBinaryNumber<TNumber>, IMinMaxValue<TNumber>, IBitwiseOperators<TNumber, TNumber, TNumber>
{
if (WideLane.IsSupported)
{
var warper = new SPMDJobWrapper<T, TNumber>
{
innerJob = job,
totalCount = totalCount,
};
var iterations = (totalCount + WideLane<TNumber>.LaneWidth - 1) / WideLane<TNumber>.LaneWidth;
return jobScheduler.ScheduleParallelFor(ref warper, iterations, batchSize, threadIndex, dependency);
}
else
{
var warper = new SPMDScalerJobWrapper<T, TNumber>
{
innerJob = job,
totalCount = totalCount,
};
return jobScheduler.ScheduleParallelFor(ref warper, totalCount, batchSize, threadIndex, dependency);
}
}
}