Use OpenSeeFace to control Live2D model

[facial-landmarks-for-cubism.git] / src / facial_landmark_detector.cpp
diff --git a/src/facial_landmark_detector.cpp b/src/facial_landmark_detector.cpp

index 20ec7c8..b953240 100644 (file)
--- a/src/facial_landmark_detector.cpp
+++ b/src/facial_landmark_detector.cpp
@@ -1,5 +1,5 @@
  /****
-Copyright (c) 2020 Adrian I. Lam
+Copyright (c) 2020-2021 Adrian I. Lam
  
  Permission is hereby granted, free of charge, to any person obtaining a copy
  of this software and associated documentation files (the "Software"), to deal
@@ -26,12 +26,12 @@ SOFTWARE.
  #include <sstream>
  #include <cmath>
  
-#include <opencv2/opencv.hpp>
-
-#include <dlib/opencv.h>
-#include <dlib/image_processing/frontal_face_detector.h>
-#include <dlib/image_processing.h>
-#include <dlib/image_processing/render_face_detections.h>
+#include <cinttypes>
+#include <cstring>
+#include <sys/types.h>
+#include <sys/socket.h>
+#include <arpa/inet.h>
+#include <unistd.h>
  
  #include "facial_landmark_detector.h"
  #include "math_utils.h"
@@ -52,13 +51,38 @@ FacialLandmarkDetector::FacialLandmarkDetector(std::string cfgPath)
  {
      parseConfig(cfgPath);
  
-    if (!webcam.open(m_cfg.cvVideoCaptureId))
+    // Build the local address on which OSF packets are received.
+    // Value-initialize so the padding bytes (sin_zero) are zeroed.
+    struct sockaddr_in addr = {};
+    addr.sin_family = AF_INET;
+    addr.sin_port = htons(m_cfg.osfPort);
+    // inet_pton reports malformed addresses unambiguously, unlike
+    // inet_addr whose error value is itself a valid address.
+    if (inet_pton(AF_INET, m_cfg.osfIpAddress.c_str(), &addr.sin_addr) != 1)
+    {
+        throw std::runtime_error("Invalid OSF IP address");
+    }
+
+    m_sock = socket(AF_INET, SOCK_DGRAM, IPPROTO_UDP);
+    if (m_sock < 0)
+    {
+        throw std::runtime_error("Cannot create UDP socket");
+    }
+
+    int ret = bind(m_sock, (struct sockaddr *)&addr, sizeof addr);
+    if (ret != 0)
      {
-        throw std::runtime_error("Unable to open webcam");
+        // The destructor is not run when the constructor throws, so the
+        // descriptor must be released here to avoid leaking it.
+        close(m_sock);
+        throw std::runtime_error("Cannot bind socket");
      }
+}
  
-    detector = dlib::get_frontal_face_detector();
-    dlib::deserialize(m_cfg.predictorPath) >> predictor;
+// Releases the UDP socket created by the constructor.
+FacialLandmarkDetector::~FacialLandmarkDetector()
+{
+    close(m_sock);
  }
  
  FacialLandmarkDetector::Params FacialLandmarkDetector::getParams(void) const
@@ -74,26 +87,34 @@ FacialLandmarkDetector::Params FacialLandmarkDetector::getParams(void) const
  
      double leftEye = avg(m_leftEyeOpenness, 1);
      double rightEye = avg(m_rightEyeOpenness, 1);
-    // Just combine the two to get better synchronized blinks
-    // This effectively disables winks, so if we want to
-    // support winks in the future (see below) we will need
-    // a better way to handle this out-of-sync blinks.
-    double bothEyes = (leftEye + rightEye) / 2;
-    leftEye = bothEyes;
-    rightEye = bothEyes;
-    // Detect winks and make them look better
-    // Commenting out - winks are difficult to be detected by the
-    // dlib data set anyway... maybe in the future we can
-    // add a runtime option to enable/disable...
-    /*if (right == 0 && left > 0.2)
+    bool sync = !m_cfg.winkEnable;
+
+    if (m_cfg.winkEnable)
      {
-        left = 1;
+        if (rightEye < 0.1 && leftEye > 0.2)
+        {
+            leftEye = 1;
+            rightEye = 0;
+        }
+        else if (leftEye < 0.1 && rightEye > 0.2)
+        {
+            leftEye = 0;
+            rightEye = 1;
+        }
+        else
+        {
+            sync = true;
+        }
      }
-    else if (left == 0 && right > 0.2)
+
+    if (sync)
      {
-        right = 1;
+        // Combine the two to get better synchronized blinks
+        double bothEyes = (leftEye + rightEye) / 2;
+        leftEye = bothEyes;
+        rightEye = bothEyes;
      }
-    */
+
      params.leftEyeOpenness = leftEye;
      params.rightEyeOpenness = rightEye;
  
@@ -111,6 +132,10 @@ FacialLandmarkDetector::Params FacialLandmarkDetector::getParams(void) const
          params.rightEyeSmile = 0;
      }
  
+    params.autoBlink = m_cfg.autoBlink;
+    params.autoBreath = m_cfg.autoBreath;
+    params.randomMotion = m_cfg.randomMotion;
+
      return params;
  }
  
@@ -123,92 +148,85 @@ void FacialLandmarkDetector::mainLoop(void)
  {
      while (!m_stop)
      {
-        cv::Mat frame;
-        if (!webcam.read(frame))
-        {
-            throw std::runtime_error("Unable to read from webcam");
-        }
-        cv::Mat flipped;
-        if (m_cfg.lateralInversion)
-        {
-            cv::flip(frame, flipped, 1);
-        }
-        else
-        {
-            flipped = frame;
-        }
-        dlib::cv_image<dlib::bgr_pixel> cimg(flipped);
+        // Read UDP packet from OSF
+        // packetFrameSize is the exact byte length of one datagram;
+        // landmarksOffset is the byte offset of the first landmark in it.
+        static const int nPoints = 68;
+        static const int packetFrameSize = 8 + 4 + 2 * 4 + 2 * 4 + 1 + 4 + 3 * 4 + 3 * 4
+                                         + 4 * 4 + 4 * 68 + 4 * 2 * 68 + 4 * 3 * 70 + 4 * 14;
  
-        if (m_cfg.showWebcamVideo)
-        {
-            win.set_image(cimg);
-        }
+        static const int landmarksOffset = 8 + 4 + 2 * 4 + 2 * 4 + 1 + 4 + 3 * 4 + 3 * 4
+                                         + 4 * 4 + 4 * 68;
  
-        std::vector<dlib::rectangle> faces = detector(cimg);
+        uint8_t buf[packetFrameSize];
+        ssize_t recvSize = recv(m_sock, buf, sizeof buf, 0);
  
-        if (faces.size() > 0)
-        {
-            dlib::rectangle face = faces[0];
-            dlib::full_object_detection shape = predictor(cimg, face);
-
-            /* The coordinates seem to be rather noisy in general.
-             * We will push everything through some moving average filters
-             * to reduce noise. The number of taps is determined empirically
-             * until we get something good.
-             * An alternative method would be to get some better dataset
-             * for dlib - perhaps even to train on a custom data set just for the user.
-             */
-
-            // Face rotation: X direction (left-right)
-            double faceXRot = calcFaceXAngle(shape);
-            filterPush(m_faceXAngle, faceXRot, m_cfg.faceXAngleNumTaps);
-
-            // Mouth form (smile / laugh) detection
-            double mouthForm = calcMouthForm(shape);
-            filterPush(m_mouthForm, mouthForm, m_cfg.mouthFormNumTaps);
-
-            // Face rotation: Y direction (up-down)
-            double faceYRot = calcFaceYAngle(shape, faceXRot, mouthForm);
-            filterPush(m_faceYAngle, faceYRot, m_cfg.faceYAngleNumTaps);
-
-            // Face rotation: Z direction (head tilt)
-            double faceZRot = calcFaceZAngle(shape);
-            filterPush(m_faceZAngle, faceZRot, m_cfg.faceZAngleNumTaps);
-
-            // Mouth openness
-            double mouthOpen = calcMouthOpenness(shape, mouthForm);
-            filterPush(m_mouthOpenness, mouthOpen, m_cfg.mouthOpenNumTaps);
-
-            // Eye openness
-            double eyeLeftOpen = calcEyeOpenness(LEFT, shape, faceYRot);
-            filterPush(m_leftEyeOpenness, eyeLeftOpen, m_cfg.leftEyeOpenNumTaps);
-            double eyeRightOpen = calcEyeOpenness(RIGHT, shape, faceYRot);
-            filterPush(m_rightEyeOpenness, eyeRightOpen, m_cfg.rightEyeOpenNumTaps);
-
-            // TODO eyebrows?
-
-            if (m_cfg.showWebcamVideo && m_cfg.renderLandmarksOnVideo)
-            {
-                win.clear_overlay();
-                win.add_overlay(dlib::render_face_detections(shape));
-            }
-        }
-        else
+        if (recvSize != packetFrameSize) continue;
+        // Note: This is dependent on endianness, and we would assume that
+        // the OSF instance is run on a machine with the same endianness
+        // as our current machine.
+        // Fields are copied out with memcpy rather than read through a
+        // casted pointer: the landmark offset is odd, so a direct float
+        // load would be misaligned (and would break strict aliasing).
+        int recvFaceId;
+        std::memcpy(&recvFaceId, buf + 8, sizeof recvFaceId);
+        if (recvFaceId != m_faceId) continue; // We only support one face
+
+        Point landmarks[nPoints];
+
+        for (int i = 0; i < nPoints; i++)
          {
-            if (m_cfg.showWebcamVideo && m_cfg.renderLandmarksOnVideo)
-            {
-                win.clear_overlay();
-            }
+            // Each landmark is a pair of consecutive floats: x, then y.
+            float xy[2];
+            std::memcpy(xy, buf + landmarksOffset + i * sizeof xy, sizeof xy);
+
+            landmarks[i].x = xy[0];
+            landmarks[i].y = xy[1];
          }
  
-        cv::waitKey(m_cfg.cvWaitKeyMs);
+        /* The coordinates seem to be rather noisy in general.
+         * We will push everything through some moving average filters
+         * to reduce noise. The number of taps is determined empirically
+         * until we get something good.
+         * An alternative method would be to get some better dataset -
+         * perhaps even to train on a custom data set just for the user.
+         */
+
+        // Face rotation: X direction (left-right)
+        double faceXRot = calcFaceXAngle(landmarks);
+        filterPush(m_faceXAngle, faceXRot, m_cfg.faceXAngleNumTaps);
+
+        // Mouth form (smile / laugh) detection
+        double mouthForm = calcMouthForm(landmarks);
+        filterPush(m_mouthForm, mouthForm, m_cfg.mouthFormNumTaps);
+
+        // Face rotation: Y direction (up-down)
+        double faceYRot = calcFaceYAngle(landmarks, faceXRot, mouthForm);
+        filterPush(m_faceYAngle, faceYRot, m_cfg.faceYAngleNumTaps);
+
+        // Face rotation: Z direction (head tilt)
+        double faceZRot = calcFaceZAngle(landmarks);
+        filterPush(m_faceZAngle, faceZRot, m_cfg.faceZAngleNumTaps);
+
+        // Mouth openness
+        double mouthOpen = calcMouthOpenness(landmarks, mouthForm);
+        filterPush(m_mouthOpenness, mouthOpen, m_cfg.mouthOpenNumTaps);
+
+        // Eye openness
+        double eyeLeftOpen = calcEyeOpenness(LEFT, landmarks, faceYRot);
+        filterPush(m_leftEyeOpenness, eyeLeftOpen, m_cfg.leftEyeOpenNumTaps);
+        double eyeRightOpen = calcEyeOpenness(RIGHT, landmarks, faceYRot);
+        filterPush(m_rightEyeOpenness, eyeRightOpen, m_cfg.rightEyeOpenNumTaps);
+
+        // Eyebrows: the landmark detection doesn't work very well for my face,
+        // so I've not implemented them.
      }
  }
  
  double FacialLandmarkDetector::calcEyeAspectRatio(
-    dlib::point& p1, dlib::point& p2,
-    dlib::point& p3, dlib::point& p4,
-    dlib::point& p5, dlib::point& p6) const
+    Point& p1, Point& p2,
+    Point& p3, Point& p4,
+    Point& p5, Point& p6) const
  {
      double eyeWidth = dist(p1, p4);
      double eyeHeight1 = dist(p2, p6);
@@ -219,19 +230,19 @@ double FacialLandmarkDetector::calcEyeAspectRatio(
  
  double FacialLandmarkDetector::calcEyeOpenness(
      LeftRight eye,
-    dlib::full_object_detection& shape,
+    Point landmarks[],
      double faceYAngle) const
  {
      double eyeAspectRatio;
      if (eye == LEFT)
      {
-        eyeAspectRatio = calcEyeAspectRatio(shape.part(42), shape.part(43), shape.part(44),
-                                            shape.part(45), shape.part(46), shape.part(47));
+        eyeAspectRatio = calcEyeAspectRatio(landmarks[42], landmarks[43], landmarks[44],
+                                            landmarks[45], landmarks[46], landmarks[47]);
      }
      else
      {
-        eyeAspectRatio = calcEyeAspectRatio(shape.part(36), shape.part(37), shape.part(38),
-                                            shape.part(39), shape.part(40), shape.part(41));
+        eyeAspectRatio = calcEyeAspectRatio(landmarks[36], landmarks[37], landmarks[38],
+                                            landmarks[39], landmarks[40], landmarks[41]);
      }
  
      // Apply correction due to faceYAngle
@@ -242,7 +253,7 @@ double FacialLandmarkDetector::calcEyeOpenness(
  
  
  
-double FacialLandmarkDetector::calcMouthForm(dlib::full_object_detection& shape) const
+double FacialLandmarkDetector::calcMouthForm(Point landmarks[]) const
  {
      /* Mouth form parameter: 0 for normal mouth, 1 for fully smiling / laughing.
       * Compare distance between the two corners of the mouth
@@ -256,12 +267,12 @@ double FacialLandmarkDetector::calcMouthForm(dlib::full_object_detection& shape)
       * the angle changes. So here we'll use the distance approach instead.
       */
  
-    auto eye1 = centroid(shape.part(36), shape.part(37), shape.part(38),
-                         shape.part(39), shape.part(40), shape.part(41));
-    auto eye2 = centroid(shape.part(42), shape.part(43), shape.part(44),
-                         shape.part(45), shape.part(46), shape.part(47));
+    auto eye1 = centroid(landmarks[36], landmarks[37], landmarks[38],
+                         landmarks[39], landmarks[40], landmarks[41]);
+    auto eye2 = centroid(landmarks[42], landmarks[43], landmarks[44],
+                         landmarks[45], landmarks[46], landmarks[47]);
      double distEyes = dist(eye1, eye2);
-    double distMouth = dist(shape.part(48), shape.part(54));
+    double distMouth = dist(landmarks[58], landmarks[62]);
  
      double form = linearScale01(distMouth / distEyes,
                                  m_cfg.mouthNormalThreshold,
@@ -271,21 +282,21 @@ double FacialLandmarkDetector::calcMouthForm(dlib::full_object_detection& shape)
  }
  
  double FacialLandmarkDetector::calcMouthOpenness(
-    dlib::full_object_detection& shape,
+    Point landmarks[],
      double mouthForm) const
  {
      // Use points for the bottom of the upper lip, and top of the lower lip
      // We have 3 pairs of points available, which give the mouth height
      // on the left, in the middle, and on the right, resp.
      // First let's try to use an average of all three.
-    double heightLeft = dist(shape.part(63), shape.part(65));
-    double heightMiddle = dist(shape.part(62), shape.part(66));
-    double heightRight = dist(shape.part(61), shape.part(67));
+    double heightLeft   = dist(landmarks[61], landmarks[63]);
+    double heightMiddle = dist(landmarks[60], landmarks[64]);
+    double heightRight  = dist(landmarks[59], landmarks[65]);
  
      double avgHeight = (heightLeft + heightMiddle + heightRight) / 3;
  
      // Now, normalize it with the width of the mouth.
-    double width = dist(shape.part(60), shape.part(64));
+    double width = dist(landmarks[58], landmarks[62]);
  
      double normalized = avgHeight / width;
  
@@ -301,24 +312,24 @@ double FacialLandmarkDetector::calcMouthOpenness(
      return scaled;
  }
  
-double FacialLandmarkDetector::calcFaceXAngle(dlib::full_object_detection& shape) const
+double FacialLandmarkDetector::calcFaceXAngle(Point landmarks[]) const
  {
      // This function will be easier to understand if you refer to the
      // diagram in faceXAngle.png
  
      // Construct the y-axis using (1) average of four points on the nose and
-    // (2) average of four points on the upper lip.
+    // (2) average of five points on the upper lip.
  
-    auto y0 = centroid(shape.part(27), shape.part(28), shape.part(29),
-                       shape.part(30));
-    auto y1 = centroid(shape.part(50), shape.part(51), shape.part(52),
-                       shape.part(62));
+    auto y0 = centroid(landmarks[27], landmarks[28], landmarks[29],
+                       landmarks[30]);
+    auto y1 = centroid(landmarks[48], landmarks[49], landmarks[50],
+                       landmarks[51], landmarks[52]);
  
      // Now drop a perpedicular from the left and right edges of the face,
      // and calculate the ratio between the lengths of these perpendiculars
  
-    auto left = centroid(shape.part(14), shape.part(15), shape.part(16));
-    auto right = centroid(shape.part(0), shape.part(1), shape.part(2));
+    auto left = centroid(landmarks[14], landmarks[15], landmarks[16]);
+    auto right = centroid(landmarks[0], landmarks[1], landmarks[2]);
  
      // Constructing a perpendicular:
      // Join the left/right point and the upper lip. The included angle
@@ -345,13 +356,13 @@ double FacialLandmarkDetector::calcFaceXAngle(dlib::full_object_detection& shape
      return theta;
  }
  
-double FacialLandmarkDetector::calcFaceYAngle(dlib::full_object_detection& shape, double faceXAngle, double mouthForm) const
+double FacialLandmarkDetector::calcFaceYAngle(Point landmarks[], double faceXAngle, double mouthForm) const
  {
      // Use the nose
      // angle between the two left/right points and the tip
-    double c = dist(shape.part(31), shape.part(35));
-    double a = dist(shape.part(30), shape.part(31));
-    double b = dist(shape.part(30), shape.part(35));
+    double c = dist(landmarks[31], landmarks[35]);
+    double a = dist(landmarks[30], landmarks[31]);
+    double b = dist(landmarks[30], landmarks[35]);
  
      double angle = solveCosineRuleAngle(c, a, b);
  
@@ -383,25 +394,25 @@ double FacialLandmarkDetector::calcFaceYAngle(dlib::full_object_detection& shape
      }
  }
  
-double FacialLandmarkDetector::calcFaceZAngle(dlib::full_object_detection& shape) const
+double FacialLandmarkDetector::calcFaceZAngle(Point landmarks[]) const
  {
      // Use average of eyes and nose
  
-    auto eyeRight = centroid(shape.part(36), shape.part(37), shape.part(38),
-                             shape.part(39), shape.part(40), shape.part(41));
-    auto eyeLeft = centroid(shape.part(42), shape.part(43), shape.part(44),
-                            shape.part(45), shape.part(46), shape.part(47));
+    auto eyeRight = centroid(landmarks[36], landmarks[37], landmarks[38],
+                             landmarks[39], landmarks[40], landmarks[41]);
+    auto eyeLeft  = centroid(landmarks[42], landmarks[43], landmarks[44],
+                             landmarks[45], landmarks[46], landmarks[47]);
  
-    auto noseLeft = shape.part(35);
-    auto noseRight = shape.part(31);
+    auto noseLeft  = landmarks[35];
+    auto noseRight = landmarks[31];
  
-    double eyeYDiff = eyeRight.y() - eyeLeft.y();
-    double eyeXDiff = eyeRight.x() - eyeLeft.x();
+    double eyeYDiff = eyeRight.y - eyeLeft.y;
+    double eyeXDiff = eyeRight.x - eyeLeft.x;
  
      double angle1 = std::atan(eyeYDiff / eyeXDiff);
  
-    double noseYDiff = noseRight.y() - noseLeft.y();
-    double noseXDiff = noseRight.x() - noseLeft.x();
+    double noseYDiff = noseRight.y - noseLeft.y;
+    double noseXDiff = noseRight.x - noseLeft.x;
  
      double angle2 = std::atan(noseYDiff / noseXDiff);
  
@@ -436,19 +447,19 @@ void FacialLandmarkDetector::parseConfig(std::string cfgPath)
              std::string paramName;
              if (ss >> paramName)
              {
-                if (paramName == "cvVideoCaptureId")
+                if (paramName == "osfIpAddress")
                  {
-                    if (!(ss >> m_cfg.cvVideoCaptureId))
+                    if (!(ss >> m_cfg.osfIpAddress))
                      {
-                        throwConfigError(paramName, "int",
+                        throwConfigError(paramName, "std::string",
                                           line, lineNum);
                      }
                  }
-                else if (paramName == "predictorPath")
+                else if (paramName == "osfPort")
                  {
-                    if (!(ss >> m_cfg.predictorPath))
+                    if (!(ss >> m_cfg.osfPort))
                      {
-                        throwConfigError(paramName, "std::string",
+                        throwConfigError(paramName, "int",
                                           line, lineNum);
                      }
                  }
@@ -484,30 +495,6 @@ void FacialLandmarkDetector::parseConfig(std::string cfgPath)
                                           line, lineNum);
                      }
                  }
-                else if (paramName == "showWebcamVideo")
-                {
-                    if (!(ss >> m_cfg.showWebcamVideo))
-                    {
-                        throwConfigError(paramName, "bool",
-                                         line, lineNum);
-                    }
-                }
-                else if (paramName == "renderLandmarksOnVideo")
-                {
-                    if (!(ss >> m_cfg.renderLandmarksOnVideo))
-                    {
-                        throwConfigError(paramName, "bool",
-                                         line, lineNum);
-                    }
-                }
-                else if (paramName == "lateralInversion")
-                {
-                    if (!(ss >> m_cfg.lateralInversion))
-                    {
-                        throwConfigError(paramName, "bool",
-                                         line, lineNum);
-                    }
-                }
                  else if (paramName == "faceXAngleNumTaps")
                  {
                      if (!(ss >> m_cfg.faceXAngleNumTaps))
@@ -564,14 +551,6 @@ void FacialLandmarkDetector::parseConfig(std::string cfgPath)
                                           line, lineNum);
                      }
                  }
-                else if (paramName == "cvWaitKeyMs")
-                {
-                    if (!(ss >> m_cfg.cvWaitKeyMs))
-                    {
-                        throwConfigError(paramName, "int",
-                                         line, lineNum);
-                    }
-                }
                  else if (paramName == "eyeClosedThreshold")
                  {
                      if (!(ss >> m_cfg.eyeClosedThreshold))
@@ -588,6 +567,14 @@ void FacialLandmarkDetector::parseConfig(std::string cfgPath)
                                           line, lineNum);
                      }
                  }
+                else if (paramName == "winkEnable")
+                {
+                    if (!(ss >> m_cfg.winkEnable))
+                    {
+                        throwConfigError(paramName, "bool",
+                                         line, lineNum);
+                    }
+                }
                  else if (paramName == "mouthNormalThreshold")
                  {
                      if (!(ss >> m_cfg.mouthNormalThreshold))
@@ -668,6 +655,30 @@ void FacialLandmarkDetector::parseConfig(std::string cfgPath)
                                           line, lineNum);
                      }
                  }
+                else if (paramName == "autoBlink")
+                {
+                    if (!(ss >> m_cfg.autoBlink))
+                    {
+                        throwConfigError(paramName, "bool",
+                                         line, lineNum);
+                    }
+                }
+                else if (paramName == "autoBreath")
+                {
+                    if (!(ss >> m_cfg.autoBreath))
+                    {
+                        throwConfigError(paramName, "bool",
+                                         line, lineNum);
+                    }
+                }
+                else if (paramName == "randomMotion")
+                {
+                    if (!(ss >> m_cfg.randomMotion))
+                    {
+                        throwConfigError(paramName, "bool",
+                                         line, lineNum);
+                    }
+                }
                  else
                  {
                      std::ostringstream oss;
@@ -685,25 +696,20 @@ void FacialLandmarkDetector::populateDefaultConfig(void)
      // These are values that I've personally tested to work OK for my face.
      // Your milage may vary - hence the config file.
  
-    m_cfg.cvVideoCaptureId = 0;
-    m_cfg.predictorPath = "shape_predictor_68_face_landmarks.dat";
      m_cfg.faceYAngleCorrection = 10;
      m_cfg.eyeSmileEyeOpenThreshold = 0.6;
      m_cfg.eyeSmileMouthFormThreshold = 0.75;
      m_cfg.eyeSmileMouthOpenThreshold = 0.5;
-    m_cfg.showWebcamVideo = true;
-    m_cfg.renderLandmarksOnVideo = true;
-    m_cfg.lateralInversion = true;
-    m_cfg.cvWaitKeyMs = 5;
-    m_cfg.faceXAngleNumTaps = 11;
-    m_cfg.faceYAngleNumTaps = 11;
-    m_cfg.faceZAngleNumTaps = 11;
+    m_cfg.faceXAngleNumTaps = 7;
+    m_cfg.faceYAngleNumTaps = 7;
+    m_cfg.faceZAngleNumTaps = 7;
      m_cfg.mouthFormNumTaps = 3;
      m_cfg.mouthOpenNumTaps = 3;
      m_cfg.leftEyeOpenNumTaps = 3;
      m_cfg.rightEyeOpenNumTaps = 3;
-    m_cfg.eyeClosedThreshold = 0.2;
-    m_cfg.eyeOpenThreshold = 0.25;
+    m_cfg.eyeClosedThreshold = 0.18;
+    m_cfg.eyeOpenThreshold = 0.21;
+    m_cfg.winkEnable = true;
      m_cfg.mouthNormalThreshold = 0.75;
      m_cfg.mouthSmileThreshold = 1.0;
      m_cfg.mouthClosedThreshold = 0.1;
@@ -714,6 +720,9 @@ void FacialLandmarkDetector::populateDefaultConfig(void)
      m_cfg.faceYAngleZeroValue = 1.8;
      m_cfg.faceYAngleDownThreshold = 2.3;
      m_cfg.faceYAngleUpThreshold = 1.3;
+    m_cfg.autoBlink = false;
+    m_cfg.autoBreath = false;
+    m_cfg.randomMotion = false;
  }
  
  void FacialLandmarkDetector::throwConfigError(std::string paramName,