Working on full frame video support.

2025-03-11 16:13:16 +01:00 · 2013-07-31 17:06:09 -07:00 · 2013-07-31 17:06:09 -07:00 · d18a9dc499
commit d18a9dc499
parent 415949cc26
2 changed files with 224 additions and 185 deletions
--- a/interface/src/Webcam.cpp
+++ b/interface/src/Webcam.cpp
@ -270,7 +270,7 @@ void Webcam::setFrame(const Mat& color, int format, const Mat& depth, float midF
    QTimer::singleShot(qMax((int)remaining / 1000, 0), _grabber, SLOT(grabFrame()));
 }

-FrameGrabber::FrameGrabber() : _initialized(false), _capture(0), _searchWindow(0, 0, 0, 0),
+FrameGrabber::FrameGrabber() : _initialized(false), _videoSendMode(FULL_FRAME_VIDEO), _capture(0), _searchWindow(0, 0, 0, 0),
    _smoothedMidFaceDepth(UNINITIALIZED_FACE_DEPTH), _colorCodec(), _depthCodec(), _frameCount(0) {
 }

@ -364,6 +364,11 @@ static void XN_CALLBACK_TYPE calibrationCompleted(SkeletonCapability& capability
 }
 #endif

+void FrameGrabber::cycleVideoSendMode() {
+    _videoSendMode = (VideoSendMode)((_videoSendMode + 1) % VIDEO_SEND_MODE_COUNT);
+    _searchWindow = cv::Rect(0, 0, 0, 0);
+}
+
 void FrameGrabber::reset() {
    _searchWindow = cv::Rect(0, 0, 0, 0);

@ -462,56 +467,54 @@ void FrameGrabber::grabFrame() {
        color = image;
    }
    
-    // if we don't have a search window (yet), try using the face cascade
-    int channels = 0;
-    float ranges[] = { 0, 180 };
-    const float* range = ranges;
-    if (_searchWindow.area() == 0) {
-        vector<Rect> faces;
-        _faceCascade.detectMultiScale(color, faces, 1.1, 6);
-        if (!faces.empty()) {
-            _searchWindow = faces.front();
-            updateHSVFrame(color, format);
-        
-            Mat faceHsv(_hsvFrame, _searchWindow);
-            Mat faceMask(_mask, _searchWindow);
-            int sizes = 30;
-            calcHist(&faceHsv, 1, &channels, faceMask, _histogram, 1, &sizes, &range);
-            double min, max;
-            minMaxLoc(_histogram, &min, &max);
-            _histogram.convertTo(_histogram, -1, (max == 0.0) ? 0.0 : 255.0 / max);
-        }
-    }
    RotatedRect faceRect;
-    if (_searchWindow.area() > 0) {
-        updateHSVFrame(color, format);
+    int encodedWidth;
+    int encodedHeight;
+    int depthBitrateMultiplier = 1;
+    if (_videoSendMode == FULL_FRAME_VIDEO) {
+        // no need to find the face if we're sending full frame video
+        faceRect.center = Point2f(color.cols / 2.0f, color.rows / 2.0f);
+        faceRect.size = Size2f(color.cols, color.rows);
+        encodedWidth = color.cols;
+        encodedHeight = color.rows;
        
-        calcBackProject(&_hsvFrame, 1, &channels, _histogram, _backProject, &range);
-        bitwise_and(_backProject, _mask, _backProject);
-        
-        faceRect = CamShift(_backProject, _searchWindow, TermCriteria(CV_TERMCRIT_EPS | CV_TERMCRIT_ITER, 10, 1));
-        Rect faceBounds = faceRect.boundingRect();
-        Rect imageBounds(0, 0, color.cols, color.rows);
-        _searchWindow = Rect(clip(faceBounds.tl(), imageBounds), clip(faceBounds.br(), imageBounds));
-    }
-    
-    const int ENCODED_FACE_WIDTH = 128;
-    const int ENCODED_FACE_HEIGHT = 128;
-    if (_colorCodec.name == 0) {
-        // initialize encoder context(s)
-        vpx_codec_enc_cfg_t codecConfig;
-        vpx_codec_enc_config_default(vpx_codec_vp8_cx(), &codecConfig, 0);
-        codecConfig.rc_target_bitrate = ENCODED_FACE_WIDTH * ENCODED_FACE_HEIGHT *
-            codecConfig.rc_target_bitrate / codecConfig.g_w / codecConfig.g_h;
-        codecConfig.g_w = ENCODED_FACE_WIDTH;
-        codecConfig.g_h = ENCODED_FACE_HEIGHT;
-        vpx_codec_enc_init(&_colorCodec, vpx_codec_vp8_cx(), &codecConfig, 0);
-        
-        if (!depth.empty()) {
-            int DEPTH_BITRATE_MULTIPLIER = 2;
-            codecConfig.rc_target_bitrate *= 2;
-            vpx_codec_enc_init(&_depthCodec, vpx_codec_vp8_cx(), &codecConfig, 0);
+    } else {
+        // if we don't have a search window (yet), try using the face cascade
+        int channels = 0;
+        float ranges[] = { 0, 180 };
+        const float* range = ranges;
+        if (_searchWindow.area() == 0) {
+            vector<Rect> faces;
+            _faceCascade.detectMultiScale(color, faces, 1.1, 6);
+            if (!faces.empty()) {
+                _searchWindow = faces.front();
+                updateHSVFrame(color, format);
+            
+                Mat faceHsv(_hsvFrame, _searchWindow);
+                Mat faceMask(_mask, _searchWindow);
+                int sizes = 30;
+                calcHist(&faceHsv, 1, &channels, faceMask, _histogram, 1, &sizes, &range);
+                double min, max;
+                minMaxLoc(_histogram, &min, &max);
+                _histogram.convertTo(_histogram, -1, (max == 0.0) ? 0.0 : 255.0 / max);
+            }
        }
+        if (_searchWindow.area() > 0) {
+            updateHSVFrame(color, format);
+            
+            calcBackProject(&_hsvFrame, 1, &channels, _histogram, _backProject, &range);
+            bitwise_and(_backProject, _mask, _backProject);
+            
+            faceRect = CamShift(_backProject, _searchWindow, TermCriteria(CV_TERMCRIT_EPS | CV_TERMCRIT_ITER, 10, 1));
+            Rect faceBounds = faceRect.boundingRect();
+            Rect imageBounds(0, 0, color.cols, color.rows);
+            _searchWindow = Rect(clip(faceBounds.tl(), imageBounds), clip(faceBounds.br(), imageBounds));
+        }
+        const int ENCODED_FACE_WIDTH = 128;
+        const int ENCODED_FACE_HEIGHT = 128;
+        encodedWidth = ENCODED_FACE_WIDTH;
+        encodedHeight = ENCODED_FACE_HEIGHT;
+        depthBitrateMultiplier = 2;
    }
    
    // correct for 180 degree rotations
@ -535,150 +538,86 @@ void FrameGrabber::grabFrame() {
        _smoothedFaceRect.angle = glm::mix(faceRect.angle, _smoothedFaceRect.angle, FACE_RECT_SMOOTHING);
    }
    
-    // resize/rotate face into encoding rectangle
-    _faceColor.create(ENCODED_FACE_WIDTH, ENCODED_FACE_HEIGHT, CV_8UC3);
-    Point2f sourcePoints[4];
-    _smoothedFaceRect.points(sourcePoints);
-    Point2f destPoints[] = { Point2f(0, ENCODED_FACE_HEIGHT), Point2f(0, 0), Point2f(ENCODED_FACE_WIDTH, 0) };
-    Mat transform = getAffineTransform(sourcePoints, destPoints);
-    warpAffine(color, _faceColor, transform, _faceColor.size());
-    
-    // convert from RGB to YV12
-    const int ENCODED_BITS_PER_Y = 8;
-    const int ENCODED_BITS_PER_VU = 2;
-    const int ENCODED_BITS_PER_PIXEL = ENCODED_BITS_PER_Y + 2 * ENCODED_BITS_PER_VU;
-    const int BITS_PER_BYTE = 8;
-    _encodedFace.resize(ENCODED_FACE_WIDTH * ENCODED_FACE_HEIGHT * ENCODED_BITS_PER_PIXEL / BITS_PER_BYTE);
-    vpx_image_t vpxImage;
-    vpx_img_wrap(&vpxImage, VPX_IMG_FMT_YV12, ENCODED_FACE_WIDTH, ENCODED_FACE_HEIGHT, 1, (unsigned char*)_encodedFace.data());
-    uchar* yline = vpxImage.planes[0];
-    uchar* vline = vpxImage.planes[1];
-    uchar* uline = vpxImage.planes[2];
-    const int Y_RED_WEIGHT = (int)(0.299 * 256);
-    const int Y_GREEN_WEIGHT = (int)(0.587 * 256);
-    const int Y_BLUE_WEIGHT = (int)(0.114 * 256);
-    const int V_RED_WEIGHT = (int)(0.713 * 256);
-    const int U_BLUE_WEIGHT = (int)(0.564 * 256);
-    int redIndex = 0;
-    int greenIndex = 1;
-    int blueIndex = 2;
-    if (format == GL_BGR) {
-        redIndex = 2;
-        blueIndex = 0;
-    }
-    for (int i = 0; i < ENCODED_FACE_HEIGHT; i += 2) {
-        uchar* ydest = yline;
-        uchar* vdest = vline;
-        uchar* udest = uline;
-        for (int j = 0; j < ENCODED_FACE_WIDTH; j += 2) {
-            uchar* tl = _faceColor.ptr(i, j);
-            uchar* tr = _faceColor.ptr(i, j + 1);
-            uchar* bl = _faceColor.ptr(i + 1, j);
-            uchar* br = _faceColor.ptr(i + 1, j + 1);
+    if (_videoSendMode != NO_VIDEO) {
+        if (_colorCodec.name == 0) {
+            // initialize encoder context(s)
+            vpx_codec_enc_cfg_t codecConfig;
+            vpx_codec_enc_config_default(vpx_codec_vp8_cx(), &codecConfig, 0);
+            codecConfig.rc_target_bitrate = encodedWidth * encodedHeight *
+                codecConfig.rc_target_bitrate / codecConfig.g_w / codecConfig.g_h;
+            codecConfig.g_w = encodedWidth;
+            codecConfig.g_h = encodedHeight;
+            vpx_codec_enc_init(&_colorCodec, vpx_codec_vp8_cx(), &codecConfig, 0);
            
-            ydest[0] = (tl[redIndex] * Y_RED_WEIGHT + tl[1] * Y_GREEN_WEIGHT + tl[blueIndex] * Y_BLUE_WEIGHT) >> 8;
-            ydest[1] = (tr[redIndex] * Y_RED_WEIGHT + tr[1] * Y_GREEN_WEIGHT + tr[blueIndex] * Y_BLUE_WEIGHT) >> 8;
-            ydest[vpxImage.stride[0]] = (bl[redIndex] * Y_RED_WEIGHT + bl[greenIndex] *
-                Y_GREEN_WEIGHT + bl[blueIndex] * Y_BLUE_WEIGHT) >> 8;
-            ydest[vpxImage.stride[0] + 1] = (br[redIndex] * Y_RED_WEIGHT + br[greenIndex] *
-                Y_GREEN_WEIGHT + br[blueIndex] * Y_BLUE_WEIGHT) >> 8;
-            ydest += 2;
-            
-            int totalRed = tl[redIndex] + tr[redIndex] + bl[redIndex] + br[redIndex];
-            int totalGreen = tl[greenIndex] + tr[greenIndex] + bl[greenIndex] + br[greenIndex];
-            int totalBlue = tl[blueIndex] + tr[blueIndex] + bl[blueIndex] + br[blueIndex];
-            int totalY = (totalRed * Y_RED_WEIGHT + totalGreen * Y_GREEN_WEIGHT + totalBlue * Y_BLUE_WEIGHT) >> 8;
-            
-            *vdest++ = (((totalRed - totalY) * V_RED_WEIGHT) >> 10) + 128;
-            *udest++ = (((totalBlue - totalY) * U_BLUE_WEIGHT) >> 10) + 128;
-        }
-        yline += vpxImage.stride[0] * 2;
-        vline += vpxImage.stride[1];
-        uline += vpxImage.stride[2];
-    }
-    
-    // encode the frame
-    vpx_codec_encode(&_colorCodec, &vpxImage, ++_frameCount, 1, 0, VPX_DL_REALTIME);
-
-    // start the payload off with the aspect ratio
-    QByteArray payload(sizeof(float), 0);
-    *(float*)payload.data() = _smoothedFaceRect.size.width / _smoothedFaceRect.size.height;
-
-    // extract the encoded frame
-    vpx_codec_iter_t iterator = 0;
-    const vpx_codec_cx_pkt_t* packet;
-    while ((packet = vpx_codec_get_cx_data(&_colorCodec, &iterator)) != 0) {
-        if (packet->kind == VPX_CODEC_CX_FRAME_PKT) {
-            // prepend the length, which will indicate whether there's a depth frame too
-            payload.append((const char*)&packet->data.frame.sz, sizeof(packet->data.frame.sz));
-            payload.append((const char*)packet->data.frame.buf, packet->data.frame.sz);
-        }
-    }
-    
-    if (!depth.empty()) {
-        // warp the face depth without interpolation (because it will contain invalid zero values)
-        _faceDepth.create(ENCODED_FACE_WIDTH, ENCODED_FACE_HEIGHT, CV_16UC1);
-        warpAffine(depth, _faceDepth, transform, _faceDepth.size(), INTER_NEAREST);
-        
-        _smoothedFaceDepth.create(ENCODED_FACE_WIDTH, ENCODED_FACE_HEIGHT, CV_16UC1);
-        
-        // smooth the depth over time
-        const ushort ELEVEN_BIT_MINIMUM = 0;
-        const ushort ELEVEN_BIT_MAXIMUM = 2047;
-        const float DEPTH_SMOOTHING = 0.25f;
-        ushort* src = _faceDepth.ptr<ushort>();
-        ushort* dest = _smoothedFaceDepth.ptr<ushort>();
-        ushort minimumDepth = numeric_limits<ushort>::max();
-        for (int i = 0; i < ENCODED_FACE_HEIGHT; i++) {
-            for (int j = 0; j < ENCODED_FACE_WIDTH; j++) {
-                ushort depth = *src++;
-                if (depth != ELEVEN_BIT_MINIMUM && depth != ELEVEN_BIT_MAXIMUM) {
-                    minimumDepth = min(minimumDepth, depth);
-                    *dest = (*dest == ELEVEN_BIT_MINIMUM) ? depth : (ushort)glm::mix(depth, *dest, DEPTH_SMOOTHING);
-                }
-                dest++;
+            if (!depth.empty()) {
+                codecConfig.rc_target_bitrate *= depthBitrateMultiplier;
+                vpx_codec_enc_init(&_depthCodec, vpx_codec_vp8_cx(), &codecConfig, 0);
            }
        }
-        const ushort MINIMUM_DEPTH_OFFSET = 64;
-        float midFaceDepth = minimumDepth + MINIMUM_DEPTH_OFFSET;
+    
+        Mat transform;
+        if (_videoSendMode == FACE_VIDEO) {
+            // resize/rotate face into encoding rectangle
+            _faceColor.create(encodedHeight, encodedWidth, CV_8UC3);
+            Point2f sourcePoints[4];
+            _smoothedFaceRect.points(sourcePoints);
+            Point2f destPoints[] = { Point2f(0, encodedHeight), Point2f(0, 0), Point2f(encodedWidth, 0) };
+            transform = getAffineTransform(sourcePoints, destPoints);
+            warpAffine(color, _faceColor, transform, _faceColor.size());
        
-        // smooth the mid face depth over time
-        const float MID_FACE_DEPTH_SMOOTHING = 0.5f;
-        _smoothedMidFaceDepth = (_smoothedMidFaceDepth == UNINITIALIZED_FACE_DEPTH) ? midFaceDepth :
-            glm::mix(midFaceDepth, _smoothedMidFaceDepth, MID_FACE_DEPTH_SMOOTHING);
-
-        // convert from 11 to 8 bits for preview/local display
-        const uchar EIGHT_BIT_MIDPOINT = 128;
-        double depthOffset = EIGHT_BIT_MIDPOINT - _smoothedMidFaceDepth;
-        depth.convertTo(_grayDepthFrame, CV_8UC1, 1.0, depthOffset);
-
-        // likewise for the encoded representation
+        } else {
+            _faceColor = color;
+        }
+        
+        // convert from RGB to YV12
+        const int ENCODED_BITS_PER_Y = 8;
+        const int ENCODED_BITS_PER_VU = 2;
+        const int ENCODED_BITS_PER_PIXEL = ENCODED_BITS_PER_Y + 2 * ENCODED_BITS_PER_VU;
+        const int BITS_PER_BYTE = 8;
+        _encodedFace.resize(encodedWidth * encodedHeight * ENCODED_BITS_PER_PIXEL / BITS_PER_BYTE);
+        vpx_image_t vpxImage;
+        vpx_img_wrap(&vpxImage, VPX_IMG_FMT_YV12, encodedWidth, encodedHeight, 1,
+            (unsigned char*)_encodedFace.data());
        uchar* yline = vpxImage.planes[0];
        uchar* vline = vpxImage.planes[1];
        uchar* uline = vpxImage.planes[2];
-        const uchar EIGHT_BIT_MAXIMUM = 255;
-        for (int i = 0; i < ENCODED_FACE_HEIGHT; i += 2) {
+        const int Y_RED_WEIGHT = (int)(0.299 * 256);
+        const int Y_GREEN_WEIGHT = (int)(0.587 * 256);
+        const int Y_BLUE_WEIGHT = (int)(0.114 * 256);
+        const int V_RED_WEIGHT = (int)(0.713 * 256);
+        const int U_BLUE_WEIGHT = (int)(0.564 * 256);
+        int redIndex = 0;
+        int greenIndex = 1;
+        int blueIndex = 2;
+        if (format == GL_BGR) {
+            redIndex = 2;
+            blueIndex = 0;
+        }
+        for (int i = 0; i < encodedHeight; i += 2) {
            uchar* ydest = yline;
            uchar* vdest = vline;
            uchar* udest = uline;
-            for (int j = 0; j < ENCODED_FACE_WIDTH; j += 2) {
-                ushort tl = *_smoothedFaceDepth.ptr<ushort>(i, j);
-                ushort tr = *_smoothedFaceDepth.ptr<ushort>(i, j + 1);
-                ushort bl = *_smoothedFaceDepth.ptr<ushort>(i + 1, j);
-                ushort br = *_smoothedFaceDepth.ptr<ushort>(i + 1, j + 1);
-            
-                uchar mask = EIGHT_BIT_MAXIMUM;
+            for (int j = 0; j < encodedWidth; j += 2) {
+                uchar* tl = _faceColor.ptr(i, j);
+                uchar* tr = _faceColor.ptr(i, j + 1);
+                uchar* bl = _faceColor.ptr(i + 1, j);
+                uchar* br = _faceColor.ptr(i + 1, j + 1);
                
-                ydest[0] = (tl == ELEVEN_BIT_MINIMUM) ? (mask = EIGHT_BIT_MIDPOINT) : saturate_cast<uchar>(tl + depthOffset);
-                ydest[1] = (tr == ELEVEN_BIT_MINIMUM) ? (mask = EIGHT_BIT_MIDPOINT) : saturate_cast<uchar>(tr + depthOffset);
-                ydest[vpxImage.stride[0]] = (bl == ELEVEN_BIT_MINIMUM) ?
-                    (mask = EIGHT_BIT_MIDPOINT) : saturate_cast<uchar>(bl + depthOffset);
-                ydest[vpxImage.stride[0] + 1] = (br == ELEVEN_BIT_MINIMUM) ?
-                    (mask = EIGHT_BIT_MIDPOINT) : saturate_cast<uchar>(br + depthOffset);
+                ydest[0] = (tl[redIndex] * Y_RED_WEIGHT + tl[1] * Y_GREEN_WEIGHT + tl[blueIndex] * Y_BLUE_WEIGHT) >> 8;
+                ydest[1] = (tr[redIndex] * Y_RED_WEIGHT + tr[1] * Y_GREEN_WEIGHT + tr[blueIndex] * Y_BLUE_WEIGHT) >> 8;
+                ydest[vpxImage.stride[0]] = (bl[redIndex] * Y_RED_WEIGHT + bl[greenIndex] *
+                    Y_GREEN_WEIGHT + bl[blueIndex] * Y_BLUE_WEIGHT) >> 8;
+                ydest[vpxImage.stride[0] + 1] = (br[redIndex] * Y_RED_WEIGHT + br[greenIndex] *
+                    Y_GREEN_WEIGHT + br[blueIndex] * Y_BLUE_WEIGHT) >> 8;
                ydest += 2;
-            
-                *vdest++ = mask;
-                *udest++ = EIGHT_BIT_MIDPOINT;
+                
+                int totalRed = tl[redIndex] + tr[redIndex] + bl[redIndex] + br[redIndex];
+                int totalGreen = tl[greenIndex] + tr[greenIndex] + bl[greenIndex] + br[greenIndex];
+                int totalBlue = tl[blueIndex] + tr[blueIndex] + bl[blueIndex] + br[blueIndex];
+                int totalY = (totalRed * Y_RED_WEIGHT + totalGreen * Y_GREEN_WEIGHT + totalBlue * Y_BLUE_WEIGHT) >> 8;
+                
+                *vdest++ = (((totalRed - totalY) * V_RED_WEIGHT) >> 10) + 128;
+                *udest++ = (((totalBlue - totalY) * U_BLUE_WEIGHT) >> 10) + 128;
            }
            yline += vpxImage.stride[0] * 2;
            vline += vpxImage.stride[1];
@ -686,21 +625,117 @@ void FrameGrabber::grabFrame() {
        }
        
        // encode the frame
-        vpx_codec_encode(&_depthCodec, &vpxImage, _frameCount, 1, 0, VPX_DL_REALTIME);
+        vpx_codec_encode(&_colorCodec, &vpxImage, ++_frameCount, 1, 0, VPX_DL_REALTIME);
+
+        // start the payload off with the aspect ratio
+        QByteArray payload(sizeof(float), 0);
+        *(float*)payload.data() = _smoothedFaceRect.size.width / _smoothedFaceRect.size.height;

        // extract the encoded frame
        vpx_codec_iter_t iterator = 0;
        const vpx_codec_cx_pkt_t* packet;
-        while ((packet = vpx_codec_get_cx_data(&_depthCodec, &iterator)) != 0) {
+        while ((packet = vpx_codec_get_cx_data(&_colorCodec, &iterator)) != 0) {
            if (packet->kind == VPX_CODEC_CX_FRAME_PKT) {
+                // prepend the length, which will indicate whether there's a depth frame too
+                payload.append((const char*)&packet->data.frame.sz, sizeof(packet->data.frame.sz));
                payload.append((const char*)packet->data.frame.buf, packet->data.frame.sz);
            }
        }
+        
+        if (!depth.empty()) {
+            if (_videoSendMode == FACE_VIDEO) {
+                // warp the face depth without interpolation (because it will contain invalid zero values)
+                _faceDepth.create(encodedHeight, encodedWidth, CV_16UC1);
+                warpAffine(depth, _faceDepth, transform, _faceDepth.size(), INTER_NEAREST);
+            
+            } else {
+                _faceDepth = depth;
+            }
+            _smoothedFaceDepth.create(encodedHeight, encodedWidth, CV_16UC1);
+            
+            // smooth the depth over time
+            const ushort ELEVEN_BIT_MINIMUM = 0;
+            const ushort ELEVEN_BIT_MAXIMUM = 2047;
+            const float DEPTH_SMOOTHING = 0.25f;
+            ushort* src = _faceDepth.ptr<ushort>();
+            ushort* dest = _smoothedFaceDepth.ptr<ushort>();
+            ushort minimumDepth = numeric_limits<ushort>::max();
+            for (int i = 0; i < encodedHeight; i++) {
+                for (int j = 0; j < encodedWidth; j++) {
+                    ushort depth = *src++;
+                    if (depth != ELEVEN_BIT_MINIMUM && depth != ELEVEN_BIT_MAXIMUM) {
+                        minimumDepth = min(minimumDepth, depth);
+                        *dest = (*dest == ELEVEN_BIT_MINIMUM) ? depth : (ushort)glm::mix(depth, *dest, DEPTH_SMOOTHING);
+                    }
+                    dest++;
+                }
+            }
+            const ushort MINIMUM_DEPTH_OFFSET = 64;
+            const float FIXED_MID_DEPTH = 640.0f;
+            float midFaceDepth = (_videoSendMode == FACE_VIDEO) ? (minimumDepth + MINIMUM_DEPTH_OFFSET) : FIXED_MID_DEPTH;
+            
+            // smooth the mid face depth over time
+            const float MID_FACE_DEPTH_SMOOTHING = 0.5f;
+            _smoothedMidFaceDepth = (_smoothedMidFaceDepth == UNINITIALIZED_FACE_DEPTH) ? midFaceDepth :
+                glm::mix(midFaceDepth, _smoothedMidFaceDepth, MID_FACE_DEPTH_SMOOTHING);
+
+            // convert from 11 to 8 bits for preview/local display
+            const uchar EIGHT_BIT_MIDPOINT = 128;
+            double depthOffset = EIGHT_BIT_MIDPOINT - _smoothedMidFaceDepth;
+            depth.convertTo(_grayDepthFrame, CV_8UC1, 1.0, depthOffset);
+
+            // likewise for the encoded representation
+            uchar* yline = vpxImage.planes[0];
+            uchar* vline = vpxImage.planes[1];
+            uchar* uline = vpxImage.planes[2];
+            const uchar EIGHT_BIT_MAXIMUM = 255;
+            for (int i = 0; i < encodedHeight; i += 2) {
+                uchar* ydest = yline;
+                uchar* vdest = vline;
+                uchar* udest = uline;
+                for (int j = 0; j < encodedWidth; j += 2) {
+                    ushort tl = *_smoothedFaceDepth.ptr<ushort>(i, j);
+                    ushort tr = *_smoothedFaceDepth.ptr<ushort>(i, j + 1);
+                    ushort bl = *_smoothedFaceDepth.ptr<ushort>(i + 1, j);
+                    ushort br = *_smoothedFaceDepth.ptr<ushort>(i + 1, j + 1);
+                
+                    uchar mask = EIGHT_BIT_MAXIMUM;
+                    
+                    ydest[0] = (tl == ELEVEN_BIT_MINIMUM) ? (mask = EIGHT_BIT_MIDPOINT) :
+                        saturate_cast<uchar>(tl + depthOffset);
+                    ydest[1] = (tr == ELEVEN_BIT_MINIMUM) ? (mask = EIGHT_BIT_MIDPOINT) :
+                        saturate_cast<uchar>(tr + depthOffset);
+                    ydest[vpxImage.stride[0]] = (bl == ELEVEN_BIT_MINIMUM) ? (mask = EIGHT_BIT_MIDPOINT) :
+                        saturate_cast<uchar>(bl + depthOffset);
+                    ydest[vpxImage.stride[0] + 1] = (br == ELEVEN_BIT_MINIMUM) ? (mask = EIGHT_BIT_MIDPOINT) :
+                        saturate_cast<uchar>(br + depthOffset);
+                    ydest += 2;
+                
+                    *vdest++ = mask;
+                    *udest++ = EIGHT_BIT_MIDPOINT;
+                }
+                yline += vpxImage.stride[0] * 2;
+                vline += vpxImage.stride[1];
+                uline += vpxImage.stride[2];
+            }
+            
+            // encode the frame
+            vpx_codec_encode(&_depthCodec, &vpxImage, _frameCount, 1, 0, VPX_DL_REALTIME);
+
+            // extract the encoded frame
+            vpx_codec_iter_t iterator = 0;
+            const vpx_codec_cx_pkt_t* packet;
+            while ((packet = vpx_codec_get_cx_data(&_depthCodec, &iterator)) != 0) {
+                if (packet->kind == VPX_CODEC_CX_FRAME_PKT) {
+                    payload.append((const char*)packet->data.frame.buf, packet->data.frame.sz);
+                }
+            }
+        }
+    
+        QMetaObject::invokeMethod(Application::getInstance(), "sendAvatarFaceVideoMessage",
+            Q_ARG(int, _frameCount), Q_ARG(QByteArray, payload));
    }
    
-    QMetaObject::invokeMethod(Application::getInstance(), "sendAvatarFaceVideoMessage",
-        Q_ARG(int, _frameCount), Q_ARG(QByteArray, payload));
-
    QMetaObject::invokeMethod(Application::getInstance()->getWebcam(), "setFrame",
        Q_ARG(cv::Mat, color), Q_ARG(int, format), Q_ARG(cv::Mat, _grayDepthFrame), Q_ARG(float, _smoothedMidFaceDepth),
        Q_ARG(cv::RotatedRect, _smoothedFaceRect), Q_ARG(JointVector, joints));
--- a/interface/src/Webcam.h
+++ b/interface/src/Webcam.h
@ -100,16 +100,20 @@ public:

 public slots:
    
+    void cycleVideoSendMode();
    void reset();
    void shutdown();
    void grabFrame();
    
 private:
    
+    enum VideoSendMode { NO_VIDEO, FACE_VIDEO, FULL_FRAME_VIDEO, VIDEO_SEND_MODE_COUNT };
+    
    bool init();
    void updateHSVFrame(const cv::Mat& frame, int format);
    
    bool _initialized;
+    VideoSendMode _videoSendMode;
    CvCapture* _capture;
    cv::CascadeClassifier _faceCascade;
    cv::Mat _hsvFrame;