Add UseGpu property to ModelConfiguration and update network runtime configuration

This commit is contained in:
MaddoScientisto 2026-05-09 17:29:56 +02:00
commit f4f8a58646
3 changed files with 50 additions and 30 deletions

View file

@ -139,6 +139,12 @@
must match the class ordering used by the trained recognition network.
</summary>
</member>
<member name="P:AIFotoONLUS.Core.ModelConfiguration.UseGpu">
<summary>
When enabled, request OpenCV DNN CUDA backend/target for inference.
The installed OpenCV runtime must have CUDA support or model loading/forwarding may fail.
</summary>
</member>
<member name="P:AIFotoONLUS.Core.ModelConfiguration.EnableCropSaving">
<summary>
When enabled, recognition crops will be saved to disk under

View file

@ -55,6 +55,12 @@ namespace AIFotoONLUS.Core
/// </summary>
public string[] NumberClasses { get; set; } = new[] { "0", "1", "2", "3", "4", "5", "6", "7", "8", "9" };
/// <summary>
/// When enabled, request OpenCV DNN CUDA backend/target for inference.
/// The installed OpenCV runtime must have CUDA support or model loading/forwarding may fail.
/// </summary>
public bool UseGpu { get; set; } = false;
/// <summary>
/// When enabled, recognition crops will be saved to disk under
/// "logs/crops" for diagnostic inspection. Disabled by default.

View file

@ -95,10 +95,8 @@ namespace AIFotoONLUS.Core
_detectionNet = CvDnn.ReadNetFromDarknet(_cfg.DetectionCfg, _cfg.DetectionWeights);
_recognitionNet = CvDnn.ReadNetFromDarknet(_cfg.RecognitionCfg, _cfg.RecognitionWeights);
_detectionNet.SetPreferableBackend(Backend.OPENCV);
_detectionNet.SetPreferableTarget(Target.CPU);
_recognitionNet.SetPreferableBackend(Backend.OPENCV);
_recognitionNet.SetPreferableTarget(Target.CPU);
ConfigureNetRuntime(_detectionNet, _cfg.UseGpu);
ConfigureNetRuntime(_recognitionNet, _cfg.UseGpu);
// Let OpenCV use multiple threads internally (use number of logical processors)
try
{
@ -127,6 +125,19 @@ namespace AIFotoONLUS.Core
private string[] GetOutputLayerNames(Net net) => net.GetUnconnectedOutLayersNames();
private static void ConfigureNetRuntime(Net net, bool useGpu)
{
if (useGpu)
{
net.SetPreferableBackend(Backend.CUDA);
net.SetPreferableTarget(Target.CUDA);
return;
}
net.SetPreferableBackend(Backend.OPENCV);
net.SetPreferableTarget(Target.CPU);
}
/// <summary>
/// Detect text regions in the supplied image using the detection network.
/// </summary>
@ -152,7 +163,7 @@ namespace AIFotoONLUS.Core
var outNames = GetOutputLayerNames(detectionNet);
var outsList = new List<Mat>();
detectionNet.Forward(outsList, outNames);
Mat[] outs = outsList.ToArray();
if (outs.Length == 0)
{
@ -162,15 +173,15 @@ namespace AIFotoONLUS.Core
var fallback = new List<Mat>();
for (int on = 0; on < outNames.Length; on++)
{
try
{
var single = detectionNet.Forward(outNames[on]);
fallback.Add(single);
}
catch (Exception ex)
{
_logger?.LogError(ex, "Fallback Forward failed for {name}", outNames[on]);
}
try
{
var single = detectionNet.Forward(outNames[on]);
fallback.Add(single);
}
catch (Exception ex)
{
_logger?.LogError(ex, "Fallback Forward failed for {name}", outNames[on]);
}
}
if (fallback.Count > 0)
{
@ -221,21 +232,21 @@ namespace AIFotoONLUS.Core
}
if (maxScore > _cfg.ConfidenceThreshold)
{
int x = (int)Math.Max(0, Math.Round(cx - w / 2));
int y = (int)Math.Max(0, Math.Round(cy - h / 2));
var rect = new Rect(x, y, (int)Math.Round(w), (int)Math.Round(h));
boxes.Add(rect);
confidences.Add(maxScore);
classIds.Add(bestClass);
centerXList.Add(cx);
}
{
int x = (int)Math.Max(0, Math.Round(cx - w / 2));
int y = (int)Math.Max(0, Math.Round(cy - h / 2));
var rect = new Rect(x, y, (int)Math.Round(w), (int)Math.Round(h));
boxes.Add(rect);
confidences.Add(maxScore);
classIds.Add(bestClass);
centerXList.Add(cx);
}
}
}
if (boxes.Count == 0) return Enumerable.Empty<DetectedRegion>();
CvDnn.NMSBoxes(boxes, confidences, (float)_cfg.ConfidenceThreshold, (float)_cfg.NmsThreshold, out int[] indices);
@ -486,10 +497,8 @@ namespace AIFotoONLUS.Core
{
var det = CvDnn.ReadNetFromDarknet(_cfg.DetectionCfg, _cfg.DetectionWeights);
var rec = CvDnn.ReadNetFromDarknet(_cfg.RecognitionCfg, _cfg.RecognitionWeights);
det.SetPreferableBackend(Backend.OPENCV);
det.SetPreferableTarget(Target.CPU);
rec.SetPreferableBackend(Backend.OPENCV);
rec.SetPreferableTarget(Target.CPU);
ConfigureNetRuntime(det, _cfg.UseGpu);
ConfigureNetRuntime(rec, _cfg.UseGpu);
netsBag.Add((det, rec));
return (det, rec);
});
@ -525,8 +534,7 @@ namespace AIFotoONLUS.Core
try
{
using var tempRec = CvDnn.ReadNetFromDarknet(_cfg.RecognitionCfg, _cfg.RecognitionWeights);
tempRec.SetPreferableBackend(Backend.OPENCV);
tempRec.SetPreferableTarget(Target.CPU);
ConfigureNetRuntime(tempRec, _cfg.UseGpu);
var alt = RecognizeDigits(crop, tempRec, ctx);
if (!string.IsNullOrEmpty(alt)) txt = alt;
}