Search code examples
c#uwpazure-cognitive-servicesface-api

How to detect face attributes using Microsoft Cognitive service by providing Windows.Media.FaceAnalysis DetectedFace list?


I am able to get faces from Live Web Cam as a list of Windows.Media.FaceAnalysis DetectedFace objects. Now I would like to pass these faces to Microsoft Cognitive Services API to detect faces and get the face attributes. How can I do this?

IList<DetectedFace> faces = null;

// Create a VideoFrame object specifying the pixel format we want our capture image to be (NV12 bitmap in this case).
// GetPreviewFrame will convert the native webcam frame into this format.
const BitmapPixelFormat InputPixelFormat = BitmapPixelFormat.Nv12;
using (VideoFrame previewFrame = new VideoFrame(InputPixelFormat, (int)this.videoProperties.Width, (int)this.videoProperties.Height))
{
    await this.mediaCapture.GetPreviewFrameAsync(previewFrame);

    // The returned VideoFrame should be in the supported NV12 format but we need to verify this.
    if (FaceDetector.IsBitmapPixelFormatSupported(previewFrame.SoftwareBitmap.BitmapPixelFormat))
    {
        faces = await this.faceDetector.DetectFacesAsync(previewFrame.SoftwareBitmap);

        // Now pass this faces to Cognitive services API
        // faceClient.DetectAsync
    }
}

Solution

  • The DetectedFace object contains the bounding box of the actual face. So you can use this knowledge to create an in-memory stream of the face and send it over to the Face Client.

    private async Task DetectAsync()
    {
        IList<DetectedFace> faces = null;
        const BitmapPixelFormat InputPixelFormat = BitmapPixelFormat.Nv12;
        using (VideoFrame destinationPreviewFrame = new VideoFrame(InputPixelFormat, 640, 480))
        {
            await this._mediaCapture.GetPreviewFrameAsync(destinationPreviewFrame);
    
            if (FaceDetector.IsBitmapPixelFormatSupported(InputPixelFormat))
            {
                faces = await this.faceDetector.DetectFacesAsync(destinationPreviewFrame.SoftwareBitmap);
    
                foreach (var face in faces)
                {
                    // convert NV12 to RGBA16 format
                    SoftwareBitmap convertedBitmap = SoftwareBitmap.Convert(destinationPreviewFrame.SoftwareBitmap, BitmapPixelFormat.Rgba16);
    
                    // get the raw bytes of the detected face
                    byte[] rawBytes = await GetBytesFromBitmap(convertedBitmap, BitmapEncoder.BmpEncoderId, face.FaceBox);
    
                    // read the bitmap and send it to the face client
                    using (Stream stream = rawBytes.AsBuffer().AsStream())
                    {
                        var faceAttributesToReturn = new List<FaceAttributeType>()
                        {
                            FaceAttributeType.Age,
                            FaceAttributeType.Emotion,
                            FaceAttributeType.Hair
                        };
    
                        Face[] detectedFaces = await this.faceClient.DetectAsync(stream, true, true, faceAttributesToReturn);
    
                        Debug.Assert(detectedFaces.Length > 0);
                    }
                }
            }
        }
    }
    
    private async Task<byte[]> GetBytesFromBitmap(SoftwareBitmap soft, Guid encoderId, BitmapBounds bounds)
    {
        byte[] array = null;
    
        using (var ms = new InMemoryRandomAccessStream())
        {
            BitmapEncoder encoder = await BitmapEncoder.CreateAsync(encoderId, ms);
            encoder.SetSoftwareBitmap(soft);
    
            // apply the bounds of the face
            encoder.BitmapTransform.Bounds = bounds;
    
            await encoder.FlushAsync();
    
            array = new byte[ms.Size];
    
            await ms.ReadAsync(array.AsBuffer(), (uint)ms.Size, InputStreamOptions.None);
        }
    
        return array;
    }