1 files changed, 1035 insertions, 0 deletions
diff --git a/trunk/channels/console_video.c b/trunk/channels/console_video.c
new file mode 100644
index 000000000..554d03c39
--- /dev/null
+++ b/trunk/channels/console_video.c
@@ -0,0 +1,1035 @@
+/*
+ * Asterisk -- An open source telephony toolkit.
+ *
+ * Copyright 2007-2008, Marta Carbone, Sergio Fadda, Luigi Rizzo
+ *
+ * See http://www.asterisk.org for more information about
+ * the Asterisk project. Please do not directly contact
+ * any of the maintainers of this project for assistance;
+ * the project provides a web site, mailing lists and IRC
+ * channels for your use.
+ *
+ * This program is free software, distributed under the terms of
+ * the GNU General Public License Version 2. See the LICENSE file
+ * at the top of the source tree.
+ */
+
+/*
+ * Experimental support for video sessions. We use SDL for rendering, ffmpeg
+ * as the codec library for encoding and decoding, and Video4Linux and X11
+ * to generate the local video stream.
+ *
+ * If one of these pieces is not available, either at compile time or at
+ * runtime, we do our best to run without it. Of course, no codec library
+ * means we can only deal with raw data, no SDL means we cannot do rendering,
+ * no V4L or X11 means we cannot generate data (but in principle we could
+ * stream from or record to a file).
+ *
+ * We need a recent (2007.07.12 or newer) version of ffmpeg to avoid warnings.
+ * Older versions might give 'deprecated' messages during compilation,
+ * thus not compiling in AST_DEVMODE, or don't have swscale, in which case
+ * you can try to compile #defining OLD_FFMPEG here.
+ *
+ * $Revision$
+ */
+
+//#define DROP_PACKETS 5       /* if set, drop this % of video packets */
+//#define OLD_FFMPEG	1	/* set for old ffmpeg with no swscale */
+
+#include "asterisk.h"
+ASTERISK_FILE_VERSION(__FILE__, "$Revision$")
+#include <sys/ioctl.h>
+#include "asterisk/cli.h"
+#include "asterisk/file.h"
+#include "asterisk/channel.h"
+
+#include "console_video.h"
+
+/*
+The code is structured as follows.
+
+When a new console channel is created, we call console_video_start()
+to initialize SDL, the source, and the encoder/ decoder for the
+formats in use (XXX the latter two should be done later, once the
+codec negotiation is complete).  Also, a thread is created to handle
+the video source and generate frames.
+
+While communication is on, the local source is generated by the
+video thread, which wakes up periodically, generates frames and
+enqueues them in chan->readq.  Incoming rtp frames are passed to
+console_write_video(), decoded and passed to SDL for display.
+
+Unfortunate and confusing as it may be, we need to deal with a
+number of different video representations (size, codec/pixel format,
+codec parameters), as follows:
+
+ loc_src	is the data coming from the camera/X11/etc.
+	The format is typically constrained by the video source.
+
+ enc_in		is the input required by the encoder.
+	Typically constrained in size by the encoder type.
+
+ enc_out	is the bitstream transmitted over RTP.
+	Typically negotiated while the call is established.
+
+ loc_dpy	is the format used to display the local video source.
+	Depending on user preferences this can have the same size as
+	loc_src_fmt, or enc_in_fmt, or thumbnail size (e.g. PiP output)
+
+ dec_in		is the incoming RTP bitstream. Negotiated
+	during call establishment, it is not necessarily the same as
+	enc_in_fmt
+
+ dec_out	the output of the decoder.
+	The format is whatever the other side sends, and the
+	buffer is allocated by avcodec_decode_... so we only
+	copy the data here.
+
+ rem_dpy	the format used to display the remote stream
+
+We store the format info together with the buffer storing the data.
+As a future optimization, a format/buffer may reference another one
+if the formats are equivalent. This will save some unnecessary format
+conversion.
+
+
+In order to handle video you need to add to sip.conf (and presumably
+iax.conf too) the following:
+
+	[general](+)
+		videosupport=yes
+		allow=h263	; this or other video formats
+		allow=h263p	; this or other video formats
+
+ */
+
+/*
+ * Codecs are absolutely necessary or we cannot do anything.
+ * SDL is optional (used for rendering only), so that we can still
+ * stream video without displaying it.
+ */
+#if !defined(HAVE_VIDEO_CONSOLE) || !defined(HAVE_FFMPEG)
+/* stubs if required pieces are missing */
+int console_write_video(struct ast_channel *chan, struct ast_frame *f)
+{
+	return 0;	/* stub: the frame is not looked at, writing video not supported */
+}
+/* stub: no video CLI variable is recognised without video support */
+int console_video_cli(struct video_desc *env, const char *var, int fd)
+{
+	return 1;	/* nothing matched */
+}
+/* stub: no video configuration keyword is handled; *penv is left untouched */
+int console_video_config(struct video_desc **penv, const char *var, const char *val)
+{
+	return 1;	/* no configuration */
+}
+/* stub: only logs that the console runs without video */
+void console_video_start(struct video_desc *env, struct ast_channel *owner)
+{
+	ast_log(LOG_NOTICE, "voice only, console video support not present\n");
+}
+/* stub: nothing was started, so there is nothing to tear down */
+void console_video_uninit(struct video_desc *env)
+{
+}
+/* empty format mask for the build without video support */
+int console_video_formats = 0;
+
+#else /* defined(HAVE_VIDEO_CONSOLE) && defined(HAVE_FFMPEG) */
+
+/*! The video formats we support, as an OR of AST_FORMAT_* flags. */
+int console_video_formats = 
+	AST_FORMAT_H263_PLUS | AST_FORMAT_H263 |
+	AST_FORMAT_MP4_VIDEO | AST_FORMAT_H264 | AST_FORMAT_H261 ;
+
+
+
+static void my_scale(struct fbuf_t *in, AVPicture *p_in,	/* defined further down in this file */
+	struct fbuf_t *out, AVPicture *p_out);
+
+struct video_codec_desc;	/* forward declaration: video_out_desc below only stores a pointer to it */
+/*
+ * Descriptor of the local source, made of the following pieces:
+ *  + configuration info (geometry, device name, fps...). These are read
+ *    from the config file and copied here before calling video_out_init();
+ *  + the frame buffer (buf) and source pixel format, allocated at init time;
+ *  + the encoding and RTP info, including timestamps to generate
+ *    frames at the correct rate;
+ *  + source-specific info, i.e. fd for /dev/video, dpy-image for x11, etc,
+ *    filled in by grabber_open
+ * NOTE: loc_src.data == NULL means the rest of the struct is invalid, and
+ *	the video source is not available.
+ */
+struct video_out_desc {
+	/* video device support.
+	 * videodevice and geometry are read from the config file.
+	 * At the right time we try to open the source (grabber_open()); if we
+	 * are successful, grabber is set and grabber_read() can return frames.
+	 */
+	/* all the following is config file info copied from the parent */
+	char		videodevice[64];	/* source name, passed to the grabber's open() */
+	int		fps;	/* frames per second; paces grabber_read() and sets the encoder time base */
+	int		bitrate;	/* copied into the encoder context bit_rate */
+	int		qmin;	/* copied into the encoder context qmin */
+
+	int sendvideo;	/* if 0, frames are grabbed and displayed but not encoded */
+
+	struct fbuf_t	loc_src_geometry;	/* local source geometry only (from config file) */
+	struct fbuf_t	enc_out;	/* encoder output buffer, allocated in video_out_init() */
+
+	struct video_codec_desc *enc;	/* encoder descriptor, picked by name in console_video_start() */
+	void		*enc_ctx;	/* encoding context (an AVCodecContext, see video_out_init()) */
+	AVCodec		*codec;	/* result of avcodec_find_encoder(); only a reference, never freed */
+	AVFrame		*enc_in_frame;	/* enc_in mapped into avcodec format. */
+					/* The initial part of AVFrame is an AVPicture */
+	int		mtu;	/* set to 1400 in video_out_init(), passed to enc_encap() */
+	struct timeval	last_frame;	/* when we read the last frame, see grabber_read() */
+
+	struct grab_desc *grabber;	/* the video source in use, NULL if none is open */
+	void		*grabber_data;	/* opaque value returned by the grabber's open() */
+};
+
+/*
+ * The overall descriptor, with room for config info, video source and
+ * received data descriptors, SDL info, etc.
+ * This should be globally visible to all modules (grabber, vcodecs, gui)
+ * and contain all configuration info.
+ */
+struct video_desc {
+	char			codec_name[64];	/* the codec we use; may be overwritten by map_config_video_format() */
+
+	int			stayopen;	/* set if gui starts manually (console_video_start() with no owner) */
+	pthread_t		vthread;	/* video thread, runs video_thread() */
+	ast_mutex_t		dec_lock;	/* sync decoder and video thread */
+	int			shutdown;	/* set to shutdown vthread; the thread clears it when it exits */
+	struct ast_channel	*owner;		/* owner channel, NULL when not in a call */
+
+
+	struct fbuf_t	enc_in;		/* encoder input buffer, allocated in video_out_init() */
+
+	char			keypad_file[256];	/* image for the keypad */
+	char                    keypad_font[256];       /* font for the keypad */
+
+	char			sdl_videodriver[256];	/* if not empty, exported as SDL_VIDEODRIVER by the video thread */
+
+	struct fbuf_t		rem_dpy;	/* display remote video, no buffer (it is in win[WIN_REMOTE].bmp) */
+	struct fbuf_t		loc_dpy;	/* display local source, no buffer (managed by SDL in bmp[1]) */
+
+
+	/* local information for grabbers, codecs, gui */
+	struct gui_info		*gui;		/* NULL means no gui: incoming video is not rendered */
+	struct video_dec_desc	*in;		/* remote video descriptor, created on the first incoming frame */
+	struct video_out_desc	out;		/* local video descriptor */
+};
+
+static AVPicture *fill_pict(struct fbuf_t *b, AVPicture *p);
+
+/*! \brief release the data held by a buffer, keeping w, h and pix_fmt. */
+void fbuf_free(struct fbuf_t *b)
+{
+	struct fbuf_t saved = *b;	/* snapshot taken before the wipe */
+
+	if (saved.data && saved.size)	/* with size 0 the data pointer is not freed */
+		ast_free(saved.data);
+	bzero(b, sizeof(*b));
+	b->pix_fmt = saved.pix_fmt;	/* geometry and format survive the reset */
+	b->h = saved.h;
+	b->w = saved.w;
+}
+
+#include "vcodecs.c"
+#include "console_gui.c"
+
+/*! \brief Try to open a video source, return 0 on success, 1 on error */
+static int grabber_open(struct video_out_desc *v)
+{
+	int idx = 0;
+
+	/* probe the NULL-terminated grabber list in order; the first that opens wins */
+	while (console_grabbers[idx] != NULL) {
+		struct grab_desc *cand = console_grabbers[idx++];
+		void *handle = cand->open(v->videodevice, &v->loc_src_geometry, v->fps);
+		if (handle == NULL)
+			continue;	/* open failed, try the next one */
+		v->grabber = cand;
+		v->grabber_data = handle;
+		return 0;
+	}
+	return 1;	/* list exhausted, no source found */
+}
+
+/*! \brief complete a buffer from the local video source.
+ * Called by get_video_frames(), in turn called by the video thread.
+ */
+static struct fbuf_t *grabber_read(struct video_out_desc *v)
+{
+	struct timeval now = ast_tvnow();
+
+	if (v->grabber == NULL || v->fps <= 0)	/* not initialized, or no usable frame rate */
+		return NULL;	/* fps <= 0 would make the period below divide by zero */
+
+	/* check if it is time to read; on the first call start the clock now */
+	if (ast_tvzero(v->last_frame))
+		v->last_frame = now;
+	if (ast_tvdiff_ms(now, v->last_frame) < 1000/v->fps)
+		return NULL;	/* too early, less than one frame period has elapsed */
+	v->last_frame = now; /* XXX actually, should correct for drift */
+	return v->grabber->read(v->grabber_data);
+}
+
+/*! \brief handler run when dragging with the left button on
+ * the local source window - the effect is to move the offset
+ * of the captured area.
+ */
+static void grabber_move(struct video_out_desc *v, int dx, int dy)
+{
+	struct grab_desc *g = v->grabber;	/* NULL when no source is open */
+	if (g != NULL && g->move != NULL)	/* a grabber may provide no move callback */
+		g->move(v->grabber_data, dx, dy);
+}
+
+/*
+ * Map the codec name to the library. If not recognised, use a default.
+ * This is useful in the output path where we decide by name, presumably.
+ */
+static struct video_codec_desc *map_config_video_format(char *name)
+{
+	int pos = 0;
+
+	/* case-insensitive scan of the NULL-terminated codec table */
+	while (supported_codecs[pos] && strcasecmp(name, supported_codecs[pos]->name) != 0)
+		pos++;
+	if (!supported_codecs[pos]) {	/* reached the terminator: unknown name */
+		ast_log(LOG_WARNING, "Cannot find codec for '%s'\n", name);
+		pos = 0;	/* fall back to the first entry... */
+		strcpy(name, supported_codecs[pos]->name);	/* ...and write its name back; NOTE(review): unbounded copy */
+	}
+	ast_log(LOG_WARNING, "Using codec '%s'\n", name);
+	return supported_codecs[pos];
+}
+
+
+/*! \brief uninitialize the descriptor for local video stream */
+static int video_out_uninit(struct video_desc *env)
+{
+	struct video_out_desc *out = &env->out;
+	AVCodecContext *ctx = (AVCodecContext *)out->enc_ctx;
+
+	/* XXX the encoder teardown should be a codec callback */
+	if (ctx != NULL) {
+		avcodec_close(ctx);
+		av_free(ctx);
+	}
+	out->enc_ctx = NULL;
+	if (out->enc_in_frame != NULL)
+		av_free(out->enc_in_frame);
+	out->enc_in_frame = NULL;
+	out->codec = NULL;	/* only a reference, nothing to free */
+	/* drop the encoder input and output buffers */
+	fbuf_free(&env->enc_in);
+	fbuf_free(&out->enc_out);
+
+	/* shut the video source; close() hands back the new grabber_data value */
+	if (out->grabber != NULL) {
+		out->grabber_data = out->grabber->close(out->grabber_data);
+		out->grabber = NULL;
+	}
+	return -1;	/* constant, so error paths can 'return video_out_uninit(env);' */
+}
+
+/*
+ * Initialize the encoder for the local source:
+ * - enc_ctx, codec, enc_in_frame are used by ffmpeg for encoding;
+ * - enc_out is used to store the encoded frame (to be sent)
+ * - mtu is used to determine the max size of video fragment
+ * NOTE: we enter here with the video source already open.
+ */
+static int video_out_init(struct video_desc *env)
+{
+	int codec, size;
+	struct fbuf_t *enc_in = &env->enc_in;
+	struct video_out_desc *v = &env->out;
+	AVCodecContext *enc_ctx;
+
+	v->enc_ctx		= NULL;	/* clean state: video_out_uninit() is then safe on any error path */
+	v->codec		= NULL;
+	v->enc_in_frame		= NULL;
+	v->enc_out.data		= NULL;
+
+	codec = map_video_format(v->enc->format, CM_WR);
+	v->codec = avcodec_find_encoder(codec);
+	if (!v->codec) {
+		ast_log(LOG_WARNING, "Cannot find the encoder for format %d\n", codec);
+		return -1;	/* error, but nothing to undo yet */
+	}
+
+	v->mtu = 1400;	/* set it early so the encoder can use it */
+
+	/* allocate the input buffer for encoding.
+	 * ffmpeg only supports PIX_FMT_YUV420P for the encoding.
+	 */
+	enc_in->pix_fmt = PIX_FMT_YUV420P;
+	enc_in->size = (enc_in->w * enc_in->h * 3)/2;
+	enc_in->data = ast_calloc(1, enc_in->size);
+	if (!enc_in->data) {
+		ast_log(LOG_WARNING, "Cannot allocate encoder input buffer\n");
+		return video_out_uninit(env);
+	}
+	/* construct an AVFrame that points into enc_in->data */
+	v->enc_in_frame = avcodec_alloc_frame();
+	if (!v->enc_in_frame) {
+		ast_log(LOG_WARNING, "Unable to allocate the encoding video frame\n");
+		return video_out_uninit(env);
+	}
+
+	/* plane pointers and strides for PIX_FMT_YUV420P: Y, then U, then V */
+	size = enc_in->w * enc_in->h;
+	v->enc_in_frame->data[0] = enc_in->data;
+	v->enc_in_frame->data[1] = v->enc_in_frame->data[0] + size;
+	v->enc_in_frame->data[2] = v->enc_in_frame->data[1] + size/4;
+	v->enc_in_frame->linesize[0] = enc_in->w;
+	v->enc_in_frame->linesize[1] = enc_in->w/2;
+	v->enc_in_frame->linesize[2] = enc_in->w/2;
+
+	/* now setup the parameters for the encoder.
+	 * XXX should be codec-specific
+	 */
+	enc_ctx = avcodec_alloc_context();
+	if (!enc_ctx) {	/* must be checked: the context is dereferenced right below */
+		ast_log(LOG_WARNING, "Unable to allocate the encoder context\n");
+		return video_out_uninit(env);
+	}
+	v->enc_ctx = enc_ctx;
+	enc_ctx->pix_fmt = enc_in->pix_fmt;
+	enc_ctx->width = enc_in->w;
+	enc_ctx->height = enc_in->h;
+	/* XXX rtp_callback ?
+	 * rtp_mode so ffmpeg inserts as many start codes as possible.
+	 */
+	enc_ctx->rtp_mode = 1;
+	enc_ctx->rtp_payload_size = v->mtu / 2; // mtu/2
+	enc_ctx->bit_rate = v->bitrate;
+	enc_ctx->bit_rate_tolerance = enc_ctx->bit_rate/2;
+	enc_ctx->qmin = v->qmin;	/* should be configured */
+	enc_ctx->time_base = (AVRational){1, v->fps};
+	enc_ctx->gop_size = v->fps*5; // emit I frame every 5 seconds
+	v->enc->enc_init(v->enc_ctx);	/* codec-specific callback, run before the codec is opened */
+	if (avcodec_open(enc_ctx, v->codec) < 0) {
+		ast_log(LOG_WARNING, "Unable to initialize the encoder %d\n", codec);
+		av_free(enc_ctx);	/* never opened: free it here so uninit does not avcodec_close() it */
+		v->enc_ctx = NULL;
+		return video_out_uninit(env);
+	}
+	/*
+	 * Allocate enough for the encoded bitstream. As we are compressing,
+	 * we hope that the output is never larger than the input size.
+	 */
+	v->enc_out.data = ast_calloc(1, enc_in->size);
+	if (!v->enc_out.data) {	/* without this buffer nothing can be sent: fail the init */
+		ast_log(LOG_WARNING, "Cannot allocate encoder output buffer\n");
+		return video_out_uninit(env);
+	}
+	v->enc_out.size = enc_in->size;
+	v->enc_out.used = 0;
+	return 0;	/* success; every failure path above returns -1 */
+}
+
+/*! \brief possibly uninitialize the video console.
+ * Called at the end of a call, should reset the 'owner' field,
+ * then possibly terminate the video thread if the gui has
+ * not been started manually.
+ * In practice, signal the thread and give it a bit of time to
+ * complete, giving up if it gets stuck. Because uninit
+ * is called from hangup with the channel locked, and the thread
+ * uses the chan lock, we need to unlock here. This is unsafe,
+ * and we should really use refcounts for the channels.
+ */
+void console_video_uninit(struct video_desc *env)
+{
+	int i;
+	if (env == NULL) return;	/* video not initialized, same guard as console_video_start() */
+	if (env->stayopen == 0) {	/* in a call */
+		env->shutdown = 1;	/* video_thread() resets it to 0 when it exits */
+		for (i=0; env->shutdown && i < 10; i++) {
+			if (env->owner)	/* drop the channel lock while we wait */
+				ast_channel_unlock(env->owner);
+			usleep(i == 0 ? 100 : 1000000);	/* initial wait is shorter, then make it longer */
+			if (env->owner)
+				ast_channel_lock(env->owner);
+		}
+	}
+	env->owner = NULL;	/* this is unconditional */
+}
+
+/*! fill an AVPicture from our fbuf info, as it is required by
+ * the image conversion routines in ffmpeg.
+ * XXX This depends on the format.
+ */
+static AVPicture *fill_pict(struct fbuf_t *b, AVPicture *p)
+{
+	int quarter = b->w * b->h/4;	/* size of U or V frame */
+	int y_stride = b->w;	/* default: planar, one byte per Y sample */
+	int uv_stride = b->w/2;	/* default: planar, U/V lines are half width */
+	int bpp = 1;	/* bytes per pixel, > 1 only for the packed formats below */
+	switch (b->pix_fmt) {
+	case PIX_FMT_RGBA32:
+		bpp = 4;
+		break;
+	case PIX_FMT_RGB555:
+	case PIX_FMT_RGB565:
+	case PIX_FMT_YUYV422:	/* Packed YUV 4:2:2, 16bpp, Y0 Cb Y1 Cr */
+		bpp = 2;	/* all data in first plane, probably */
+		break;
+	}
+	if (bpp > 1) {	/* packed: a single plane, no separate U/V lines */
+		y_stride *= bpp;
+		uv_stride = 0;
+	}
+	bzero(p, sizeof(*p));
+	p->data[0] = b->data;
+	p->linesize[0] = y_stride;
+	p->linesize[1] = p->linesize[2] = uv_stride;
+	if (uv_stride) {	/* U and V pointers are only valid for component images */
+		p->data[1] = b->data + 4*quarter;
+		p->data[2] = b->data + 5*quarter;
+	} else {
+		p->data[1] = p->data[2] = b->data + y_stride;
+	}
+	return p;
+}
+
+/*! convert/scale between an input and an output format.
+ * Old version of ffmpeg only have img_convert, which does not rescale.
+ * New versions use sws_scale which does both.
+ */
+static void my_scale(struct fbuf_t *in, AVPicture *p_in,
+	struct fbuf_t *out, AVPicture *p_out)
+{
+	AVPicture my_p_in, my_p_out;
+
+	/* a NULL picture means: build one from the fbuf's own data, size and format */
+	if (p_in == NULL)
+		p_in = fill_pict(in, &my_p_in);
+	if (p_out == NULL)
+		p_out = fill_pict(out, &my_p_out);
+	/* a buffer that was never allocated (e.g. the encoder setup failed) has
+	 * no pixels to read or write: give up instead of handing NULL to ffmpeg */
+	if (p_in->data[0] == NULL || p_out->data[0] == NULL)
+		return;
+
+#ifdef OLD_FFMPEG
+	/* XXX img_convert is deprecated, and does not do rescaling */
+	img_convert(p_out, out->pix_fmt,
+		p_in, in->pix_fmt, in->w, in->h);
+#else /* XXX replacement */
+    {
+	struct SwsContext *convert_ctx;
+
+	convert_ctx = sws_getContext(in->w, in->h, in->pix_fmt,
+		out->w, out->h, out->pix_fmt,
+		SWS_BICUBIC, NULL, NULL, NULL);
+	if (convert_ctx == NULL) {
+		ast_log(LOG_ERROR, "FFMPEG::convert_cmodel : swscale context initialization failed\n");
+		return;
+	}
+	/* src slice is the whole image: it starts at row 0 and is in->h rows tall */
+	sws_scale(convert_ctx, p_in->data, p_in->linesize, 0, in->h,
+		p_out->data, p_out->linesize);
+	sws_freeContext(convert_ctx);
+    }
+#endif /* XXX replacement */
+}
+
+struct video_desc *get_video_desc(struct ast_channel *c);	/* no definition in the visible part of this file; presumably supplied by the console channel driver -- TODO confirm */
+
+/*
+ * This function is called (by asterisk) for each video packet
+ * coming from the network (the 'in' path) that needs to be processed.
+ * We need to reconstruct the entire video frame before we can decode it.
+ * After a video packet is received we have to:
+ * - extract the bitstream with pre_process_data()
+ * - append the bitstream to a buffer
+ * - if the fragment is the last (RTP Marker) we decode it with decode_video()
+ * - after the decoding is completed we display the decoded frame with show_frame()
+ */
+int console_write_video(struct ast_channel *chan, struct ast_frame *f);
+int console_write_video(struct ast_channel *chan, struct ast_frame *f)
+{
+	struct video_desc *env = get_video_desc(chan);
+	struct video_dec_desc *v;
+
+	if (env == NULL || !env->gui)	/* video not configured, or no gui: no rendering */
+		return 0;
+	v = env->in;
+	if (v == NULL)	/* no decoder yet: create it, masking the marker bit out of the format */
+		env->in = v = dec_init(f->subclass & ~1);
+	if (v == NULL) {
+		/* This is not fatal, but we won't have incoming video */
+		ast_log(LOG_WARNING, "Cannot initialize input decoder\n");
+		return 0;
+	}
+	if (v->dec_in_cur == NULL)	/* no buffer for incoming frames, drop */
+		return 0;
+#if defined(DROP_PACKETS) && DROP_PACKETS > 0
+	/* Simulate lost packets */
+	if ((random() % 10000) <= 100*DROP_PACKETS) {
+		ast_log(LOG_NOTICE, "Packet lost [%d]\n", f->seqno);
+		return 0;
+	}
+#endif
+	if (v->discard) {
+		/*
+		 * In discard mode, drop packets until we find one with
+		 * the RTP marker set (which is the end of frame).
+		 * Note that the RTP marker flag is sent as the LSB of the
+		 * subclass, which is a  bitmask of formats. The low bit is
+		 * normally used for audio so there is no interference.
+		 */
+		if (f->subclass & 0x01) {
+			v->dec_in_cur->used = 0;
+			v->dec_in_cur->ebit = 0;
+			v->next_seq = f->seqno + 1;	/* wrap at 16 bit */
+			v->discard = 0;
+			ast_log(LOG_WARNING, "out of discard mode, frame %d\n", f->seqno);
+		}
+		return 0;
+	}
+
+	/*
+	 * Only in-order fragments will be accepted. Remember seqno
+	 * has 16 bit so there is wraparound. Also, ideally we could
+	 * accept a bit of reordering, but at the moment we don't.
+	 */
+	if (v->next_seq != f->seqno) {
+		ast_log(LOG_WARNING, "discarding frame out of order, %d %d\n",
+			v->next_seq, f->seqno);
+		v->discard = 1;
+		return 0;
+	}
+	v->next_seq++;
+
+	if (f->data == NULL || f->datalen < 2) {
+		ast_log(LOG_WARNING, "empty video frame, discard\n");
+		return 0;
+	}
+	if (v->d_callbacks->dec_decap(v->dec_in_cur, f->data, f->datalen)) {
+		ast_log(LOG_WARNING, "error in dec_decap, enter discard\n");
+		v->discard = 1;
+	}
+	if (f->subclass & 0x01) {	// RTP Marker
+		/* prepare to decode: advance the buffer so the video thread knows. */
+		struct fbuf_t *tmp = v->dec_in_cur;	/* store current pointer */
+		ast_mutex_lock(&env->dec_lock);
+		if (++v->dec_in_cur == &v->dec_in[N_DEC_IN])	/* advance to next, circular */
+			v->dec_in_cur = &v->dec_in[0];
+		if (v->dec_in_dpy == NULL) {	/* were not displaying anything, so set it */
+			v->dec_in_dpy = tmp;
+		} else if (v->dec_in_dpy == v->dec_in_cur) { /* current slot is busy */
+			v->dec_in_cur = NULL;	/* the video thread re-enables us when it frees a slot */
+		}
+		ast_mutex_unlock(&env->dec_lock);
+	}
+	return 0;	/* every path returns 0 */
+}
+
+
+/*! \brief read a frame from webcam or X11 through grabber_read(),
+ * display it,  then encode and split it.
+ * Return a list of ast_frame representing the video fragments.
+ * The head pointer is returned by the function, the tail pointer
+ * is returned as an argument.
+ */
+static struct ast_frame *get_video_frames(struct video_desc *env, struct ast_frame **tail)
+{
+	static volatile int warned = 0;	/* counts the calls that found no output buffer */
+	struct video_out_desc *out = &env->out;
+	struct ast_frame *unused_tail;	/* sink used when the caller passes tail == NULL */
+	struct fbuf_t *grabbed = grabber_read(out);
+
+	if (grabbed == NULL)	/* can happen, e.g. we are reading too early */
+		return NULL;
+	if (tail == NULL)
+		tail = &unused_tail;
+	*tail = NULL;
+	/* Convert the grabbed image to the encoder input first, and render
+	 * that one locally, so we will see the same as the remote party.
+	 */
+	my_scale(grabbed, NULL, &env->enc_in, NULL);
+	show_frame(env, WIN_LOCAL);
+
+	if (!out->sendvideo)	/* display only, no frames are produced */
+		return NULL;
+	if (out->enc_out.data != NULL) {
+		out->enc->enc_run(out);	/* encode, then split into a list of frames */
+		return out->enc->enc_encap(&out->enc_out, out->mtu, tail);
+	}
+	if (warned++ < 2)	/* complain only the first two times */
+		ast_log(LOG_WARNING, "fail, no encoder output buffer\n");
+	return NULL;
+}
+
+/*
+ * Helper thread to periodically poll the video source and enqueue the
+ * generated frames to the channel's queue.
+ * Using a separate thread also helps because the encoding can be
+ * computationally expensive so we don't want to starve the main thread.
+ */
+static void *video_thread(void *arg)
+{
+	struct video_desc *env = arg;
+	int count = 0;
+	char save_display[128] = "";
+
+	/* if sdl_videodriver is set, override the environment. Also,
+	 * if it is 'aalib-console' override DISPLAY around the call to sdl_setup()
+	 * so we use the console as opposed to the x11 version of aalib
+	 */
+	if (!ast_strlen_zero(env->sdl_videodriver)) { /* override */
+		const char *s = getenv("DISPLAY");
+		setenv("SDL_VIDEODRIVER", env->sdl_videodriver, 1);
+		if (s && !strcasecmp(env->sdl_videodriver, "aalib-console")) {
+			ast_copy_string(save_display, s, sizeof(save_display));
+			unsetenv("DISPLAY");
+		}
+	}
+	sdl_setup(env);
+	if (!ast_strlen_zero(save_display))	/* put DISPLAY back as it was */
+		setenv("DISPLAY", save_display, 1);
+
+	/* initialize grab coordinates */
+	env->out.loc_src_geometry.x = 0;
+	env->out.loc_src_geometry.y = 0;
+
+	ast_mutex_init(&env->dec_lock);	/* used to sync decoder and renderer */
+
+	if (grabber_open(&env->out)) {
+		ast_log(LOG_WARNING, "cannot open local video source\n");
+	} else {
+#if 0
+		/* In principle, try to register the fd.
+		 * In practice, many webcam drivers do not support select/poll,
+		 * so don't bother and instead read periodically from the
+		 * video thread.
+		 */
+		if (env->out.fd >= 0)
+			ast_channel_set_fd(env->owner, 1, env->out.fd);
+#endif
+		video_out_init(env);
+	}
+
+	for (;;) {
+		struct timeval t = { 0, 50000 };	/* XXX 20 times/sec */
+		struct ast_frame *p, *f;
+		struct ast_channel *chan;
+		int fd;
+		char *caption = NULL, buf[160];
+
+		/* rebuild the caption once every 10 iterations; NULL otherwise */
+		if (count++ % 10 == 0) {
+			if (env->out.sendvideo)	/* bounded: two 63-char names plus numbers can exceed buf */
+			    snprintf(buf, sizeof(buf), "%s %s %dx%d @@ %dfps %dkbps",
+				env->out.videodevice, env->codec_name,
+				env->enc_in.w, env->enc_in.h,
+				env->out.fps, env->out.bitrate/1000);
+			else
+			    snprintf(buf, sizeof(buf), "hold");
+			caption = buf;
+		}
+
+		/* manage keypad events */
+		/* XXX here we should always check for events,
+		* otherwise the drag will not work */ 
+		if (env->gui)
+			eventhandler(env, caption);
+ 
+		/* sleep for a while */
+		ast_select(0, NULL, NULL, NULL, &t);
+
+		if (env->in) {
+			struct video_dec_desc *v = env->in;
+
+			/*
+			 * While there is something to display, call the decoder and free
+			 * the buffer, possibly enabling the receiver to store new data.
+			 */
+			while (v->dec_in_dpy) {
+				struct fbuf_t *tmp = v->dec_in_dpy;	/* store current pointer */
+
+				if (v->d_callbacks->dec_run(v, tmp))
+					show_frame(env, WIN_REMOTE);
+				tmp->used = 0;	/* mark buffer as free */
+				tmp->ebit = 0;
+				ast_mutex_lock(&env->dec_lock);
+				if (++v->dec_in_dpy == &v->dec_in[N_DEC_IN])	/* advance to next, circular */
+					v->dec_in_dpy = &v->dec_in[0];
+
+				if (v->dec_in_cur == NULL)	/* receiver was idle, enable it... */
+					v->dec_in_cur = tmp;	/* using the slot just freed */
+				else if (v->dec_in_dpy == v->dec_in_cur) /* this was the last slot */
+					v->dec_in_dpy = NULL;	/* nothing more to display */
+				ast_mutex_unlock(&env->dec_lock);
+			}
+		}
+
+		if (env->shutdown)
+			break;
+		f = get_video_frames(env, &p);	/* read and display */
+		if (!f)
+			continue;
+		chan = env->owner;
+		if (chan == NULL)	/* NOTE(review): the frames in f are dropped here without being freed */
+			continue;
+		ast_channel_lock(chan);
+		fd = chan->alertpipe[1];	/* read the pipe fd only once we hold the channel lock */
+
+		/* AST_LIST_INSERT_TAIL is only good for one frame, cannot use here */
+		if (chan->readq.first == NULL) {
+			chan->readq.first = f;
+		} else {
+			chan->readq.last->frame_list.next = f;
+		}
+		chan->readq.last = p;
+		/*
+		 * more or less same as ast_queue_frame, but extra
+		 * write on the alertpipe to signal frames.
+		 */
+		if (fd > -1) {
+			int blah = 1, l = sizeof(blah);
+			for (p = f; p; p = AST_LIST_NEXT(p, frame_list)) {	/* one write per queued frame */
+				if (write(fd, &blah, l) != l)
+					ast_log(LOG_WARNING, "Unable to write to alert pipe on %s, frametype/subclass %d/%d: %s!\n",
+					    chan->name, f->frametype, f->subclass, strerror(errno));
+			}
+		}
+		ast_channel_unlock(chan);
+	}
+	/* thread terminating, here could call the uninit */
+	/* uninitialize the local and remote video environments */
+	env->in = dec_uninit(env->in);
+	video_out_uninit(env);
+
+	if (env->gui)
+		env->gui = cleanup_sdl(env->gui);
+	ast_mutex_destroy(&env->dec_lock);
+	env->shutdown = 0;	/* tells console_video_uninit() that we are done */
+	return NULL;
+}
+
+static void copy_geometry(struct fbuf_t *src, struct fbuf_t *dst)
+{
+	/* a zero dimension in dst means "unset": take that one from src. Width
+	 * and height are handled independently of each other. */
+	dst->w = dst->w ? dst->w : src->w;
+	dst->h = dst->h ? dst->h : src->h;
+}
+
+/*! initialize the video environment.
+ * Apart from the formats (constant) used by sdl and the codec,
+ * we use enc_in as the basic geometry.
+ */
+static void init_env(struct video_desc *env)
+{
+	struct fbuf_t *enc = &env->enc_in;	/* encoder input, the basic geometry */
+	struct fbuf_t *camera = &env->out.loc_src_geometry;	/* local source */
+	struct fbuf_t *remote = &env->rem_dpy;	/* remote display */
+	struct fbuf_t *local = &env->loc_dpy;	/* local display */
+
+	/* one pixel format everywhere: camera default, encoder input, sdl format */
+	camera->pix_fmt = enc->pix_fmt = PIX_FMT_YUV420P;
+	local->pix_fmt = remote->pix_fmt = PIX_FMT_YUV420P;
+	if (!enc->w || !enc->h) {	/* size missing or incomplete: default to 352x288 */
+		enc->w = 352;
+		enc->h = 288;
+	}
+	/* inherit the sizes that are still unset */
+	copy_geometry(enc, camera);	/* camera inherits from encoder input */
+	copy_geometry(enc, remote);	/* remote display inherits from encoder input */
+	copy_geometry(remote, local);	/* local display inherits from remote display */
+}
+
+/*!
+ * The first call to the video code, called by oss_new() or similar.
+ * Here we initialize the various components we use, namely SDL for display,
+ * ffmpeg for encoding/decoding, and a local video source.
+ * We do our best to progress even if some of the components are not
+ * available.
+ */
+void console_video_start(struct video_desc *env, struct ast_channel *owner)
+{
+	ast_log(LOG_WARNING, "env %p chan %p\n", env, owner);
+	if (env == NULL)	/* video not initialized */
+		return;
+	env->owner = owner;	/* work even if no owner is specified */
+	if (env->stayopen)
+		return;		/* already initialized, nothing to do */
+	init_env(env);	/* fill in pixel formats and the geometries still unset */
+	env->out.enc = map_config_video_format(env->codec_name);
+	ast_log(LOG_WARNING, "start video out %s %dx%d\n", env->codec_name, env->enc_in.w,  env->enc_in.h);
+	/*
+	 * Register all codecs supported by the ffmpeg library.
+	 * We only need to do it once, but probably doesn't
+	 * harm to do it multiple times.
+	 */
+	avcodec_init();
+	avcodec_register_all();
+	av_log_set_level(AV_LOG_ERROR);	/* only report errors */
+	if (env->out.fps <= 0) {	/* also catch negative values, the rate is used as a divisor */
+		env->out.fps = 15;
+		ast_log(LOG_WARNING, "fps unset, forcing to %d\n", env->out.fps);
+	}
+	if (env->out.bitrate == 0) {
+		env->out.bitrate = 65000;
+		ast_log(LOG_WARNING, "bitrate unset, forcing to %d\n", env->out.bitrate);
+	}
+	if (ast_pthread_create_background(&env->vthread, NULL, video_thread, env)) {
+		ast_log(LOG_ERROR, "Unable to start the video thread\n");
+		return;	/* leave stayopen clear so that a later start can try again */
+	}
+	if (env->owner == NULL)
+		env->stayopen = 1;	/* manually opened so don't close on hangup */
+}
+
+/*
+ * Parse a geometry string, accepting also common names for the formats.
+ * Trick: if we have a leading > or < and a numeric geometry,
+ * return the larger or smaller one.
+ * E.g. <352x288 gives the smaller one, 320x240
+ */
+static int video_geom(struct fbuf_t *b, const char *s)
+{
+	/* named formats, sorted from the largest to the smallest; read-only */
+	static const struct geom_name { const char *s; int w; int h; } formats[] = {
+		{"16cif",	1408, 1152 },
+		{"xga",		1024, 768 },
+		{"4cif",	704, 576 },
+		{"vga",		640, 480 },
+		{"cif",		352, 288 },
+		{"qvga",	320, 240 },
+		{"qcif",	176, 144 },
+		{"sqcif",	128, 96 },
+		{NULL,		0, 0 },
+	};
+	const struct geom_name *fp;	/* plain local cursor, no state kept between calls */
+	int w = 0, h = 0;
+	if (*s == '<' || *s == '>')
+		sscanf(s+1,"%dx%d", &w, &h);
+	for (fp = formats; fp->s; fp++) {
+		if (*s == '>') {	/* look for a larger one */
+			if (fp->w <= w) {
+				if (fp > formats)
+					fp--; /* back one step if possible */
+				break;
+			}
+		} else if (*s == '<') {	/* look for a smaller one */
+			if (fp->w < w)
+				break;
+		} else if (!strcasecmp(s, fp->s)) { /* look for a string */
+			break;
+		}
+	}
+	/* ran off the end: '<' has nothing smaller, '>' found every entry larger */
+	if (fp->s == NULL && (*s == '<' || (*s == '>' && w > 0)))
+		fp--;	/* either way the answer is the smallest entry */
+	if (fp->s) {
+		b->w = fp->w;
+		b->h = fp->h;
+	} else if (sscanf(s, "%dx%d", &b->w, &b->h) != 2) {
+		ast_log(LOG_WARNING, "Invalid video_size %s, using 352x288\n", s);
+		b->w = 352;
+		b->h = 288;
+	}
+	return 0;	/* always 0: bad input falls back to 352x288 with a warning */
+}
+
+/* extend ast_cli with video commands. Called by console_video_config */
+int console_video_cli(struct video_desc *env, const char *var, int fd)
+{
+	struct video_out_desc *out;
+
+	if (env == NULL)
+		return 1;	/* unrecognised */
+	out = &env->out;
+	if (strcasecmp(var, "videodevice") == 0) {
+		ast_cli(fd, "videodevice is [%s]\n", out->videodevice);
+	} else if (strcasecmp(var, "videocodec") == 0) {
+		ast_cli(fd, "videocodec is [%s]\n", env->codec_name);
+	} else if (strcasecmp(var, "sendvideo") == 0) {
+		ast_cli(fd, "sendvideo is [%s]\n", out->sendvideo ? "on" : "off");
+	} else if (strcasecmp(var, "video_size") == 0) {
+		/* the incoming size is reported as 0x0 while there is no decoder */
+		int in_w = env->in ? env->in->dec_out.w : 0;
+		int in_h = env->in ? env->in->dec_out.h : 0;
+		ast_cli(fd, "sizes: video %dx%d camera %dx%d local %dx%d remote %dx%d in %dx%d\n",
+			env->enc_in.w, env->enc_in.h,
+			out->loc_src_geometry.w, out->loc_src_geometry.h,
+			env->loc_dpy.w, env->loc_dpy.h,
+			env->rem_dpy.w, env->rem_dpy.h,
+			in_w, in_h);
+	} else if (strcasecmp(var, "bitrate") == 0) {
+		ast_cli(fd, "bitrate is [%d]\n", out->bitrate);
+	} else if (strcasecmp(var, "qmin") == 0) {
+		ast_cli(fd, "qmin is [%d]\n", out->qmin);
+	} else if (strcasecmp(var, "fps") == 0) {
+		ast_cli(fd, "fps is [%d]\n", out->fps);
+	} else if (strcasecmp(var, "startgui") == 0) {
+		console_video_start(env, NULL);	/* no owner: the gui is opened manually */
+	} else if (strcasecmp(var, "stopgui") == 0 && env->stayopen != 0) {
+		env->stayopen = 0;
+		if (env->gui == NULL || env->owner == NULL)	/* not in a call */
+			console_video_uninit(env);
+		else
+			ast_cli_command(-1, "console hangup");
+	} else {
+		return 1;	/* unrecognised, including "stopgui" when stayopen is 0 */
+	}
+	return 0;	/* recognised */
+}
+
+/*! parse config command for video support. */
+int console_video_config(struct video_desc **penv,
+	const char *var, const char *val)
+{
+	struct video_desc *env;
+
+	if (penv == NULL) {
+		ast_log(LOG_WARNING, "bad argument penv=NULL\n");
+		return 1;	/* error */
+	}
+	/* allocate the video descriptor first time we get here */
+	env = *penv;
+	if (env == NULL) {
+		env = *penv = ast_calloc(1, sizeof(struct video_desc));
+		if (env == NULL) {
+			ast_log(LOG_WARNING, "fail to allocate video_desc\n");
+			return 1;	/* error */
+		/* *penv was assigned NULL above, so the next call tries the allocation again */
+		}
+		/* set default values */
+		ast_copy_string(env->out.videodevice, "X11", sizeof(env->out.videodevice));
+		env->out.fps = 5;
+		env->out.bitrate = 65000;
+		env->out.sendvideo = 1;
+		env->out.qmin = 3;
+	}
+	CV_START(var, val);	/* CV_* macros are not defined in the visible part of this file; presumably each one compares var with its keyword and, on a match, handles val and jumps to CV_END -- TODO confirm */
+	CV_STR("videodevice", env->out.videodevice);
+	CV_BOOL("sendvideo", env->out.sendvideo);
+	CV_F("video_size", video_geom(&env->enc_in, val));	/* encoder input size */
+	CV_F("camera_size", video_geom(&env->out.loc_src_geometry, val));	/* local source size */
+	CV_F("local_size", video_geom(&env->loc_dpy, val));	/* local display size */
+	CV_F("remote_size", video_geom(&env->rem_dpy, val));	/* remote display size */
+	CV_STR("keypad", env->keypad_file);
+	CV_F("region", keypad_cfg_read(env->gui, val));
+	CV_STR("keypad_font", env->keypad_font);
+	CV_STR("sdl_videodriver", env->sdl_videodriver);
+	CV_UINT("fps", env->out.fps);
+	CV_UINT("bitrate", env->out.bitrate);
+	CV_UINT("qmin", env->out.qmin);
+	CV_STR("videocodec", env->codec_name);
+	return 1;	/* nothing found */
+
+	CV_END;		/* the 'nothing found' case */
+	return 0;		/* found something */
+}
+
+#endif	/* video support */