Android code for getting a snapshot from an RTCMediaStream.
package com.priologic.easyrtcMedia;
import android.app.Activity;
import android.graphics.Bitmap;
import android.util.Base64;
import android.util.Log;
import java.io.ByteArrayOutputStream;
import java.io.OutputStream;
import java.nio.ByteBuffer;
import javax.microedition.khronos.egl.EGL10;
import javax.microedition.khronos.egl.EGLConfig;
import javax.microedition.khronos.egl.EGLDisplay;
import org.webrtc.EglBase;
import org.webrtc.MediaStream;
import org.webrtc.RendererCommon;
import org.webrtc.VideoTrack;
* Created by eric on 11/04/17.
public class EasyrtcSingleFrameCapturer {
public interface BitmapListener {
public void gotBitmap(Bitmap theBitmap);
// Starts true and is cleared inside PixelBuffer.toBitmap the first time a texture frame is converted.
private static boolean firstTimeOnly = true;
// the below pixelBuffer code is based on from
/**
 * Renderer callback that grabs a video frame and converts it to a Bitmap.
 */
class PixelBuffer implements org.webrtc.VideoRenderer.Callbacks {
// Tag used for this class's log output.
final static String TAG = "PixelBuffer";
// NOTE(review): not referenced by any code visible in this copy of the file.
final static boolean LIST_CONFIGS = false;
// Dimensions of the frame being captured; assigned by initWithSize.
int mWidth, mHeight;
// EGL display handle passed to eglGetConfigAttrib in getConfigAttrib.
EGLDisplay mEGLDisplay;
// Set to true once a frame has been converted, so later renderFrame calls are ignored.
boolean gotFrame = false;
// Name of the thread that called initWithSize.
String mThreadOwner;
// Callback supplied to the constructor.
BitmapListener listener;
// Activity supplied to the constructor; its UI thread runs the frame conversion.
// The type token was missing in the original declaration ("activity;").
Activity activity;
/**
 * Creates a frame grabber.
 *
 * @param activity activity whose UI thread is used for the conversion work
 * @param listener callback stored for the captured bitmap
 */
public PixelBuffer(Activity activity, BitmapListener listener) {
    this.listener = listener;
    this.activity = activity;
}
// Vertex shader source: forwards in_pos as the position and transforms in_tc by texMatrix.
// NOTE(review): no code visible in this class references this constant.
private static final String VERTEX_SHADER_STRING =
"varying vec2 interp_tc;\n"
+ "attribute vec4 in_pos;\n"
+ "attribute vec4 in_tc;\n"
+ "\n"
+ "uniform mat4 texMatrix;\n"
+ "\n"
+ "void main() {\n"
+ " gl_Position = in_pos;\n"
+ " interp_tc = (texMatrix * in_tc).xy;\n"
+ "}\n";
/**
 * Renderer callback invoked with a frame; schedules conversion of the frame to a
 * Bitmap on the activity's UI thread.
 *
 * @param i420Frame the frame delivered by the renderer
 */
public void renderFrame(final org.webrtc.VideoRenderer.I420Frame i420Frame) {
Log.d(TAG, "entered renderFrame");
// we only want to grab a single frame but our method may get called
// a few times before we're done.
if (gotFrame || i420Frame.width == 0 || i420Frame.height == 0) {
// NOTE(review): no early return is visible after this log line in this copy — confirm one exists.
Log.d(TAG, "Already got frame so taking honourable exit");
activity.runOnUiThread(new Runnable() {
public void run() {
int width = i420Frame.width;
int height = i420Frame.height;
Log.d(TAG, "about to call initWithSize");
// Record the frame size first: toBitmap reads mWidth and mHeight.
initWithSize(width, height);
Bitmap bitmap = toBitmap(i420Frame);
// NOTE(review): the hand-off of bitmap to listener is not visible in this copy — confirm.
gotFrame = true;
private int buildARGB(int r, int g, int b) {
return (0xff << 24) |(r << 16) | (g << 8) | b;
private Bitmap toBitmap(org.webrtc.VideoRenderer.I420Frame frame) {
if (!frame.yuvFrame) {
EglBase eglBase = EglStuff.getEglBase();
if(firstTimeOnly) {
firstTimeOnly = false;
TextureToRGB textureToRGB = new TextureToRGB();
int numPixels = mWidth *mHeight;
final int bytesPerPixel = 4;
ByteBuffer framebuffer = ByteBuffer.allocateDirect(numPixels*bytesPerPixel);
final float frameAspectRatio = (float) frame.rotatedWidth() / (float) frame.rotatedHeight();
final float[] rotatedSamplingMatrix =
RendererCommon.rotateTextureMatrix(frame.samplingMatrix, frame.rotationDegree);
final float[] layoutMatrix = RendererCommon.getLayoutMatrix(
false, frameAspectRatio, (float) mWidth / mHeight);
final float[] texMatrix = RendererCommon.multiplyMatrices(rotatedSamplingMatrix, layoutMatrix);
textureToRGB.convert(framebuffer, mWidth, mHeight, frame.textureId, texMatrix);
byte [] frameBytes = framebuffer.array();
int [] dataARGB = new int[numPixels];
for(int i = 0, j = 0; j < numPixels; i+=bytesPerPixel, j++) {
// data order in frameBytes is red, green, blue, alpha, red, green, ....
dataARGB[j] = buildARGB(frameBytes[i] & 0xff,frameBytes[i+1] &0xff,frameBytes[i+2] &0xff);
Bitmap bitmap = Bitmap.createBitmap(dataARGB, mWidth, mHeight, Bitmap.Config.ARGB_8888);
return bitmap;
else {
return null;
private void initWithSize(final int width, final int height) {
mWidth = width;
mHeight = height;
// Record thread owner of OpenGL context
mThreadOwner = Thread.currentThread().getName();
// NOTE(review): no body is visible for this method in this copy of the file.
public void destroy() {
private int getConfigAttrib(final EGLConfig config, final int attribute) {
int[] value = new int[1];
return mEGL.eglGetConfigAttrib(mEGLDisplay, config,
attribute, value) ? value[0] : 0;
// Tag used for the capturer's log output.
final private static String TAG = "frameCapturer";
// Renderer wrapping the PixelBuffer callback; assigned in the constructor.
org.webrtc.VideoRenderer renderer;
/**
 * Builds a capturer for the first video track of a media stream.
 *
 * @param activity activity whose UI thread is used to deliver the bitmap
 * @param mediaStream stream to capture from; nothing is set up when it has no video track
 * @param gotFrameListener callback that receives the captured bitmap
 */
private EasyrtcSingleFrameCapturer(final Activity activity, MediaStream mediaStream, final BitmapListener gotFrameListener) {
    if (mediaStream.videoTracks.size() == 0) {
        Log.e(TAG, "No video track to capture from");
        // Stop here: getFirst() below must not run against an empty track list.
        return;
    }
    final VideoTrack videoTrack = mediaStream.videoTracks.getFirst();
    final PixelBuffer vg = new PixelBuffer(activity, new BitmapListener() {
        @Override
        public void gotBitmap(final Bitmap bitmap) {
            activity.runOnUiThread(new Runnable() {
                @Override
                public void run() {
                    try {
                        gotFrameListener.gotBitmap(bitmap);
                    } catch (Exception e1) {
                        // Boundary catch: a failing listener must not crash the UI thread.
                        Log.e(TAG, "Exception in gotBitmap callback:" + e1.getMessage(), e1);
                    }
                }
            });
        }
    });
    renderer = new org.webrtc.VideoRenderer(vg);
    // NOTE(review): attaching renderer to videoTrack is not visible in this copy of the
    // file — confirm where the renderer is added to (and removed from) the track.
}
* This constructor builds an object which captures a frame from mediastream to a Bitmap.
* @param mediaStream The input media mediaStream.
* @param gotFrameListener A callback which will receive the Bitmap.
public static void toBitmap( activity, MediaStream mediaStream, final BitmapListener gotFrameListener) {
new EasyrtcSingleFrameCapturer(activity, mediaStream, gotFrameListener);
* This method captures a frame from the supplied media stream to a jpeg file written to the supplied outputStream.
* @param mediaStream the source media stream
* @param quality the quality of the jpeq 0 to 100.
* @param outputStream the output stream the jpeg file will be written to.
* @param done a runnable that will be invoked when the outputstream has been written to.
* @return The frame capturer. You should keep a reference to the frameCapturer until the done object is invoked.
public static void toOutputStream( activity, MediaStream mediaStream, final int quality, final outputStream, final Runnable done) {
BitmapListener gotFrameListener = new BitmapListener() {
public void gotBitmap(Bitmap theBitmap) {
theBitmap.compress(Bitmap.CompressFormat.JPEG, quality, outputStream);
try {;
} catch( Exception e1) {
Log.e(TAG, "Exception in toOutputStream done callback:" + e1.getMessage());
toBitmap(activity, mediaStream, gotFrameListener);
* This method captures a frame from the supplied mediastream to a dataurl written to a StringBuilder.
* @param mediaStream the source media stream
* @param quality the quality of the jpeq 0 to 100.
* @param output a StringBuilder which will be the recipient of the dataurl.
* @param done a runnable that will be invoked when the dataurl is built.
* @return The frame capturer. You should keep a reference to the frameCapturer until the done object is invoked.
public static void toDataUrl( activity, MediaStream mediaStream, final int quality, final StringBuilder output, final Runnable done) {
final outputStream = new;
Runnable convertToUrl = new Runnable() {
public void run() {
output.append(Base64.encodeToString(outputStream.toByteArray(), Base64.DEFAULT));
try {;
} catch( Exception e1) {
Log.e(TAG, "Exception in toDataUrl done callback:" + e1.getMessage());
toOutputStream(activity, mediaStream, quality, outputStream, convertToUrl);
package com.priologic.easyrtcMedia;
import android.opengl.GLES11Ext;
import android.opengl.GLES20;
import java.nio.ByteBuffer;
import java.nio.FloatBuffer;
import org.webrtc.*;
* Class for converting OES textures to RGBA. It should be constructed on a thread with
* an active EGL context, and only be used from that thread. It is used by the EasyrtcSingleFrameCapturer.
class TextureToRGB {
// Vertex coordinates in Normalized Device Coordinates, i.e.
// (-1, -1) is bottom-left and (1, 1) is top-right.
// Four 2-component vertices, bound to the in_pos attribute in the constructor and
// drawn as a triangle strip by convert().
private static final FloatBuffer DEVICE_RECTANGLE = GlUtil.createFloatBuffer(new float[] {
-1.0f, -1.0f, // Bottom left.
1.0f, -1.0f, // Bottom right.
-1.0f, 1.0f, // Top left.
1.0f, 1.0f, // Top right.
// Texture coordinates - (0, 0) is bottom-left and (1, 1) is top-right.
// Four 2-component coordinates, bound to the in_tc attribute in the constructor.
private static final FloatBuffer TEXTURE_RECTANGLE = GlUtil.createFloatBuffer(new float[] {
0.0f, 0.0f, // Bottom left.
1.0f, 0.0f, // Bottom right.
0.0f, 1.0f, // Top left.
1.0f, 1.0f // Top right.
// Vertex shader source: forwards in_pos as the position and passes the texture
// coordinate in_tc, transformed by the texMatrix uniform, to the fragment shader.
private static final String VERTEX_SHADER =
"varying vec2 interp_tc;\n"
+ "attribute vec4 in_pos;\n"
+ "attribute vec4 in_tc;\n"
+ "\n"
+ "uniform mat4 texMatrix;\n"
+ "\n"
+ "void main() {\n"
+ " gl_Position = in_pos;\n"
+ " interp_tc = (texMatrix * in_tc).xy;\n"
+ "}\n";
// Fragment shader source: samples the external OES texture oesTex at the interpolated
// coordinate and writes the sampled colour unchanged.
private static final String FRAGMENT_SHADER =
"#extension GL_OES_EGL_image_external : require\n"
+ "precision mediump float;\n"
+ "varying vec2 interp_tc;\n"
+ "\n"
+ "uniform samplerExternalOES oesTex;\n"
+ "\n"
+ "void main() {\n"
+ " gl_FragColor = texture2D(oesTex, interp_tc);\n"
+ "}\n";
// clang-format on
// Off-screen RGBA frame buffer that convert() renders into and reads back from.
private final GlTextureFrameBuffer textureFrameBuffer;
// Shader whose uniforms and vertex attributes are configured in the constructor.
private final GlShader shader;
// Location of the texMatrix uniform, looked up in the constructor.
private final int texMatrixLoc;
// NOTE(review): no use of threadChecker is visible in this copy of the file.
private final ThreadUtils.ThreadChecker threadChecker = new ThreadUtils.ThreadChecker();
// Set by release(); convert() throws once this is true.
private boolean released = false;
* This class should be constructed on a thread that has an active EGL context.
// Creates the RGBA frame buffer and configures the shader's uniforms and vertex attributes.
// NOTE(review): shader is read below but its assignment is not visible in this copy of
// the file — confirm it is created from VERTEX_SHADER / FRAGMENT_SHADER before use.
public TextureToRGB() {
textureFrameBuffer = new GlTextureFrameBuffer(GLES20.GL_RGBA);
texMatrixLoc = shader.getUniformLocation("texMatrix");
// Point the oesTex sampler at texture unit 0.
GLES20.glUniform1i(shader.getUniformLocation("oesTex"), 0);
GlUtil.checkNoGLES2Error("Initialize fragment shader uniform values.");
// Initialize vertex shader attributes.
shader.setVertexAttribArray("in_pos", 2, DEVICE_RECTANGLE);
// If the width is not a multiple of 4 pixels, the texture
// will be scaled up slightly and clipped at the right border.
shader.setVertexAttribArray("in_tc", 2, TEXTURE_RECTANGLE);
public void convert(ByteBuffer buf, int width, int height, int srcTextureId,
float[] transformMatrix) {
if (released) {
throw new IllegalStateException("TextureToRGB.convert called on released object");
int size = width * height;
if (buf.capacity() < size) {
throw new IllegalArgumentException("TextureToRGB.convert called with too small buffer");
// Produce a frame buffer starting at top-left corner, not
// bottom-left.
transformMatrix =
RendererCommon.multiplyMatrices(transformMatrix, RendererCommon.verticalFlipMatrix());
final int frameBufferWidth = width;
final int frameBufferHeight =height;
textureFrameBuffer.setSize(frameBufferWidth, frameBufferHeight);
// Bind our framebuffer.
GLES20.glBindFramebuffer(GLES20.GL_FRAMEBUFFER, textureFrameBuffer.getFrameBufferId());
GLES20.glBindTexture(GLES11Ext.GL_TEXTURE_EXTERNAL_OES, srcTextureId);
GLES20.glUniformMatrix4fv(texMatrixLoc, 1, false, transformMatrix, 0);
GLES20.glViewport(0, 0, width, height);
GLES20.glDrawArrays(GLES20.GL_TRIANGLE_STRIP, 0, 4);
0, 0, frameBufferWidth, frameBufferHeight, GLES20.GL_RGBA, GLES20.GL_UNSIGNED_BYTE, buf);
// Restore normal framebuffer.
GLES20.glBindFramebuffer(GLES20.GL_FRAMEBUFFER, 0);
GLES20.glBindTexture(GLES20.GL_TEXTURE_2D, 0);
// Unbind texture. Reportedly needed on some devices to get
// the texture updated from the camera.
// Marks this converter as released; convert() throws IllegalStateException afterwards.
// NOTE(review): no GL resource cleanup is visible in this copy of the file — confirm.
public void release() {
released = true;
I tried to use your code, but I have an issue: the first time the toBitmap method is called, it takes a very long time.
I have found that the delay comes from the for loop that calls the buildARGB method, between lines 123 and 128:
for(int i = 0, j = 0; j < numPixels; i+=bytesPerPixel, j++) {
// data order in frameBytes is red, green, blue, alpha, red, green, ....
dataARGB[j] = buildARGB(frameBytes[i] & 0xff,frameBytes[i+1] &0xff,frameBytes[i+2] &0xff);

Here are some benchmarks of this loop:

  • the first time : loop for 418176 pixels in 2750 ms
  • the other times : loop for 418176 pixels in 49 ms

Have you seen this problem? Do you know how to handle it?
Thank you

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment