aboutsummaryrefslogtreecommitdiffstats
path: root/trunk/channels/console_video.c
diff options
context:
space:
mode:
Diffstat (limited to 'trunk/channels/console_video.c')
-rw-r--r--trunk/channels/console_video.c1035
1 files changed, 1035 insertions, 0 deletions
diff --git a/trunk/channels/console_video.c b/trunk/channels/console_video.c
new file mode 100644
index 000000000..554d03c39
--- /dev/null
+++ b/trunk/channels/console_video.c
@@ -0,0 +1,1035 @@
+/*
+ * Asterisk -- An open source telephony toolkit.
+ *
+ * Copyright 2007-2008, Marta Carbone, Sergio Fadda, Luigi Rizzo
+ *
+ * See http://www.asterisk.org for more information about
+ * the Asterisk project. Please do not directly contact
+ * any of the maintainers of this project for assistance;
+ * the project provides a web site, mailing lists and IRC
+ * channels for your use.
+ *
+ * This program is free software, distributed under the terms of
+ * the GNU General Public License Version 2. See the LICENSE file
+ * at the top of the source tree.
+ */
+
+/*
+ * Experimental support for video sessions. We use SDL for rendering, ffmpeg
+ * as the codec library for encoding and decoding, and Video4Linux and X11
+ * to generate the local video stream.
+ *
+ * If one of these pieces is not available, either at compile time or at
+ * runtime, we do our best to run without it. Of course, no codec library
+ * means we can only deal with raw data, no SDL means we cannot do rendering,
+ * no V4L or X11 means we cannot generate data (but in principle we could
+ * stream from or record to a file).
+ *
+ * We need a recent (2007.07.12 or newer) version of ffmpeg to avoid warnings.
+ * Older versions might give 'deprecated' messages during compilation,
+ * thus not compiling in AST_DEVMODE, or don't have swscale, in which case
+ * you can try to compile #defining OLD_FFMPEG here.
+ *
+ * $Revision$
+ */
+
+//#define DROP_PACKETS 5 /* if set, drop this % of video packets */
+//#define OLD_FFMPEG 1 /* set for old ffmpeg with no swscale */
+
+#include "asterisk.h"
+ASTERISK_FILE_VERSION(__FILE__, "$Revision$")
+#include <sys/ioctl.h>
+#include "asterisk/cli.h"
+#include "asterisk/file.h"
+#include "asterisk/channel.h"
+
+#include "console_video.h"
+
+/*
+The code is structured as follows.
+
+When a new console channel is created, we call console_video_start()
+to initialize SDL, the source, and the encoder/ decoder for the
+formats in use (XXX the latter two should be done later, once the
+codec negotiation is complete). Also, a thread is created to handle
+the video source and generate frames.
+
+While communication is on, the local source is generated by the
+video thread, which wakes up periodically, generates frames and
+enqueues them in chan->readq. Incoming rtp frames are passed to
+console_write_video(), decoded and passed to SDL for display.
+
+As unfortunate and confusing as it may be, we need to deal with a
+number of different video representations (size, codec/pixel format,
+codec parameters), as follows:
+
+ loc_src is the data coming from the camera/X11/etc.
+ The format is typically constrained by the video source.
+
+ enc_in is the input required by the encoder.
+ Typically constrained in size by the encoder type.
+
+ enc_out is the bitstream transmitted over RTP.
+ Typically negotiated while the call is established.
+
+ loc_dpy is the format used to display the local video source.
+ Depending on user preferences this can have the same size as
+ loc_src_fmt, or enc_in_fmt, or thumbnail size (e.g. PiP output)
+
+ dec_in is the incoming RTP bitstream. Negotiated
+ during call establishment, it is not necessarily the same as
+ enc_in_fmt
+
+ dec_out the output of the decoder.
+ The format is whatever the other side sends, and the
+ buffer is allocated by avcodec_decode_... so we only
+ copy the data here.
+
+ rem_dpy the format used to display the remote stream
+
+We store the format info together with the buffer storing the data.
+As a future optimization, a format/buffer may reference another one
+if the formats are equivalent. This will save some unnecessary format
+conversion.
+
+
+In order to handle video you need to add to sip.conf (and presumably
+iax.conf too) the following:
+
+ [general](+)
+ videosupport=yes
+ allow=h263 ; this or other video formats
+ allow=h263p ; this or other video formats
+
+ */
+
+/*
+ * Codecs are absolutely necessary or we cannot do anything.
+ * SDL is optional (used for rendering only), so that we can still
+ * stream video without displaying it.
+ */
+#if !defined(HAVE_VIDEO_CONSOLE) || !defined(HAVE_FFMPEG)
+/* stubs if required pieces are missing */
+/* Stub used when video support is compiled out: the frame is ignored and 0 is returned. */
+int console_write_video(struct ast_channel *chan, struct ast_frame *f)
+{
+ return 0; /* writing video not supported */
+}
+
+/* Stub used when video support is compiled out: no variable is ever recognised, so always return 1. */
+int console_video_cli(struct video_desc *env, const char *var, int fd)
+{
+ return 1; /* nothing matched */
+}
+
+/* Stub used when video support is compiled out: no option is consumed, so always return 1. */
+int console_video_config(struct video_desc **penv, const char *var, const char *val)
+{
+ return 1; /* no configuration */
+}
+
+/* Stub used when video support is compiled out: only logs a notice that the call is voice only. */
+void console_video_start(struct video_desc *env, struct ast_channel *owner)
+{
+ ast_log(LOG_NOTICE, "voice only, console video support not present\n");
+}
+
+/* Stub used when video support is compiled out: nothing was started, so there is nothing to release. */
+void console_video_uninit(struct video_desc *env)
+{
+}
+
+/* With video support compiled out, no video format is advertised. */
+int console_video_formats = 0;
+
+#else /* defined(HAVE_FFMPEG) && defined(HAVE_SDL) */
+
+/*! The list of video formats we support, expressed as the bitwise OR
+ * of the corresponding AST_FORMAT_* values.
+ */
+int console_video_formats =
+ AST_FORMAT_H263_PLUS | AST_FORMAT_H263 |
+ AST_FORMAT_MP4_VIDEO | AST_FORMAT_H264 | AST_FORMAT_H261 ;
+
+
+
+static void my_scale(struct fbuf_t *in, AVPicture *p_in,
+ struct fbuf_t *out, AVPicture *p_out);
+
+struct video_codec_desc; /* forward declaration */
+/*
+ * Descriptor of the local source, made of the following pieces:
+ * + configuration info (geometry, device name, fps...). These are read
+ * from the config file and copied here before calling video_out_init();
+ * + the frame buffer (buf) and source pixel format, allocated at init time;
+ * + the encoding and RTP info, including timestamps to generate
+ * frames at the correct rate;
+ * + source-specific info, i.e. fd for /dev/video, dpy-image for x11, etc,
+ * filled in by grabber_open
+ * NOTE: loc_src.data == NULL means the rest of the struct is invalid, and
+ * the video source is not available.
+ */
+struct video_out_desc {
+ /* video device support.
+ * videodevice and geometry are read from the config file.
+ * At the right time we try to open it and allocate a buffer.
+ * If we are successful, webcam_bufsize > 0 and we can read.
+ * NOTE(review): this struct has no webcam_bufsize field; the sentence
+ * above looks stale. In this file an open source is signalled by a
+ * non-NULL 'grabber' (see grabber_open() and grabber_read()).
+ */
+ /* all the following is config file info copied from the parent */
+ char videodevice[64]; /* source name, passed to each grabber's open() */
+ int fps; /* capture rate; also used for the encoder time base and GOP size */
+ int bitrate; /* copied into the encoder context bit_rate */
+ int qmin; /* copied into the encoder context qmin */
+
+ int sendvideo; /* if 0, frames are grabbed and shown locally but not encoded */
+
+ struct fbuf_t loc_src_geometry; /* local source geometry only (from config file) */
+ struct fbuf_t enc_out; /* encoder output buffer, allocated in video_out_init() */
+
+ struct video_codec_desc *enc; /* encoder */
+ void *enc_ctx; /* encoding context */
+ AVCodec *codec; /* reference returned by avcodec_find_encoder(), never freed here */
+ AVFrame *enc_in_frame; /* enc_in mapped into avcodec format. */
+ /* The initial part of AVFrame is an AVPicture */
+ int mtu; /* set to 1400 in video_out_init(), passed to enc_encap() */
+ struct timeval last_frame; /* when we read the last frame ? */
+
+ struct grab_desc *grabber; /* source driver chosen by grabber_open(), NULL if none */
+ void *grabber_data; /* opaque handle returned by the grabber's open() */
+};
+
+/*
+ * The overall descriptor, with room for config info, video source and
+ * received data descriptors, SDL info, etc.
+ * This should be globally visible to all modules (grabber, vcodecs, gui)
+ * and contain all configuration info.
+ */
+struct video_desc {
+ char codec_name[64]; /* the codec we use */
+
+ int stayopen; /* set if gui starts manually */
+ pthread_t vthread; /* video thread */
+ ast_mutex_t dec_lock; /* sync decoder and video thread */
+ int shutdown; /* set to shutdown vthread */
+ struct ast_channel *owner; /* owner channel */
+
+
+ struct fbuf_t enc_in; /* encoder input buffer, allocated in video_out_init() */
+
+ char keypad_file[256]; /* image for the keypad */
+ char keypad_font[256]; /* font for the keypad */
+
+ char sdl_videodriver[256]; /* if non-empty, exported as SDL_VIDEODRIVER by video_thread() */
+
+ struct fbuf_t rem_dpy; /* display remote video, no buffer (it is in win[WIN_REMOTE].bmp) */
+ struct fbuf_t loc_dpy; /* display local source, no buffer (managed by SDL in bmp[1]) */
+
+
+ /* local information for grabbers, codecs, gui */
+ struct gui_info *gui; /* NULL means no rendering; console_write_video() then drops frames */
+ struct video_dec_desc *in; /* remote video descriptor */
+ /* 'in' is created lazily by console_write_video() through dec_init() */
+ struct video_out_desc out; /* local video descriptor */
+};
+
+static AVPicture *fill_pict(struct fbuf_t *b, AVPicture *p);
+
+/*! \brief Release the storage attached to a frame buffer descriptor.
+ *
+ * The data pointer is freed only when both 'data' and 'size' are set.
+ * The descriptor is then zeroed, except for the geometry (w, h) and
+ * the pixel format, which are carried over unchanged.
+ */
+void fbuf_free(struct fbuf_t *b)
+{
+	struct fbuf_t saved;
+
+	saved = *b;	/* snapshot of the fields that must survive the wipe */
+	if (b->size && b->data)
+		ast_free(b->data);
+	bzero(b, sizeof(*b));
+	/* put back geometry and format */
+	b->pix_fmt = saved.pix_fmt;
+	b->h = saved.h;
+	b->w = saved.w;
+}
+
+#include "vcodecs.c"
+#include "console_gui.c"
+
+/*! \brief Try each registered grabber in turn until one opens the source.
+ *
+ * The first grabber whose open() returns a non-NULL handle is recorded
+ * in v->grabber, with its handle in v->grabber_data.
+ * \return 0 on success, 1 if no grabber could open the source.
+ */
+static int grabber_open(struct video_out_desc *v)
+{
+	int idx = 0;
+	struct grab_desc *cand;
+
+	while ((cand = console_grabbers[idx++]) != NULL) {
+		void *handle = cand->open(v->videodevice, &v->loc_src_geometry, v->fps);
+
+		if (handle == NULL)
+			continue;	/* this driver cannot handle the device */
+		v->grabber = cand;
+		v->grabber_data = handle;
+		return 0;
+	}
+	return 1;	/* no source found */
+}
+
+/*! \brief complete a buffer from the local video source.
+ * Called by get_video_frames(), in turn called by the video thread.
+ *
+ * Frames are rate-limited to v->fps: the grabber is only polled when
+ * at least 1000/fps milliseconds have elapsed since the last read.
+ * \return the buffer returned by the grabber's read() callback, or NULL
+ * when no grabber is open, the frame rate is not positive, or it is
+ * too early for the next frame.
+ */
+static struct fbuf_t *grabber_read(struct video_out_desc *v)
+{
+	struct timeval now = ast_tvnow();
+
+	if (v->grabber == NULL)	/* not initialized */
+		return NULL;
+	if (v->fps <= 0)	/* no valid rate: avoid dividing by zero below */
+		return NULL;
+
+	/* check if it is time to read */
+	if (ast_tvzero(v->last_frame))
+		v->last_frame = now;
+	if (ast_tvdiff_ms(now, v->last_frame) < 1000/v->fps)
+		return NULL;	/* too early */
+	v->last_frame = now; /* XXX actually, should correct for drift */
+	return v->grabber->read(v->grabber_data);
+}
+
+/*! \brief Forward a drag on the local source window to the grabber.
+ *
+ * dx and dy are handed unchanged to the grabber's optional move()
+ * callback, whose effect is to shift the offset of the captured area.
+ * Nothing happens when no grabber is open or it has no move() callback.
+ */
+static void grabber_move(struct video_out_desc *v, int dx, int dy)
+{
+	if (v->grabber == NULL)
+		return;
+	if (v->grabber->move == NULL)
+		return;
+	v->grabber->move(v->grabber_data, dx, dy);
+}
+
+/*
+ * Look up a codec descriptor by (case-insensitive) name.
+ * When the name is not in supported_codecs[], the first entry of the
+ * table is used instead and 'name' is overwritten with that entry's
+ * name, so the caller's buffer must be large enough to hold it.
+ * This is useful in the output path where we decide by name, presumably.
+ */
+static struct video_codec_desc *map_config_video_format(char *name)
+{
+	int idx = 0;
+
+	while (supported_codecs[idx] && strcasecmp(name, supported_codecs[idx]->name))
+		idx++;
+	if (!supported_codecs[idx]) {
+		/* unknown name: fall back to the first codec in the table */
+		ast_log(LOG_WARNING, "Cannot find codec for '%s'\n", name);
+		idx = 0;
+		strcpy(name, supported_codecs[idx]->name);
+	}
+	ast_log(LOG_WARNING, "Using codec '%s'\n", name);
+	return supported_codecs[idx];
+}
+
+
+/*! \brief Tear down everything video_out_init() and grabber_open() set up.
+ *
+ * Closes and frees the encoder context, frees the encoder input frame,
+ * releases the enc_in and enc_out buffers and closes the grabber.
+ * Each step is skipped when the corresponding resource is not present.
+ * \return always -1, so error paths can write "return video_out_uninit(env);"
+ */
+static int video_out_uninit(struct video_desc *env)
+{
+	struct video_out_desc *out = &env->out;
+	AVCodecContext *ctx = (AVCodecContext *)out->enc_ctx;
+
+	/* XXX this should be a codec callback */
+	if (ctx != NULL) {
+		avcodec_close(ctx);
+		av_free(ctx);
+		out->enc_ctx = NULL;
+	}
+	if (out->enc_in_frame != NULL) {
+		av_free(out->enc_in_frame);
+		out->enc_in_frame = NULL;
+	}
+	out->codec = NULL;	/* only a reference, nothing to free */
+
+	/* buffers */
+	fbuf_free(&env->enc_in);
+	fbuf_free(&out->enc_out);
+
+	/* video source */
+	if (out->grabber != NULL) {
+		out->grabber_data = out->grabber->close(out->grabber_data);
+		out->grabber = NULL;
+	}
+	return -1;
+}
+
+/*
+ * Initialize the encoder for the local source:
+ * - enc_ctx, codec, enc_in_frame are used by ffmpeg for encoding;
+ * - enc_out is used to store the encoded frame (to be sent)
+ * - mtu is used to determine the max size of video fragment
+ * NOTE: we enter here with the video source already open.
+ *
+ * Returns 0 on success and -1 on failure. Except for the "encoder not
+ * found" case, a failure goes through video_out_uninit(), which also
+ * closes the grabber.
+ */
+static int video_out_init(struct video_desc *env)
+{
+	int codec;
+	int size;
+	struct fbuf_t *enc_in;
+	struct video_out_desc *v = &env->out;
+	AVCodecContext *enc_ctx;
+
+	v->enc_ctx = NULL;
+	v->codec = NULL;
+	v->enc_in_frame = NULL;
+	v->enc_out.data = NULL;
+
+	codec = map_video_format(v->enc->format, CM_WR);
+	v->codec = avcodec_find_encoder(codec);
+	if (!v->codec) {
+		ast_log(LOG_WARNING, "Cannot find the encoder for format %d\n",
+			codec);
+		return -1;	/* error, but nothing to undo yet */
+	}
+
+	v->mtu = 1400;	/* set it early so the encoder can use it */
+
+	/* allocate the input buffer for encoding.
+	 * ffmpeg only supports PIX_FMT_YUV420P for the encoding.
+	 */
+	enc_in = &env->enc_in;
+	enc_in->pix_fmt = PIX_FMT_YUV420P;
+	enc_in->size = (enc_in->w * enc_in->h * 3)/2;
+	enc_in->data = ast_calloc(1, enc_in->size);
+	if (!enc_in->data) {
+		ast_log(LOG_WARNING, "Cannot allocate encoder input buffer\n");
+		return video_out_uninit(env);
+	}
+	/* construct an AVFrame that points into buf_in */
+	v->enc_in_frame = avcodec_alloc_frame();
+	if (!v->enc_in_frame) {
+		ast_log(LOG_WARNING, "Unable to allocate the encoding video frame\n");
+		return video_out_uninit(env);
+	}
+
+	/* parameters for PIX_FMT_YUV420P: Y plane, then U and V at 1/4 size */
+	size = enc_in->w * enc_in->h;
+	v->enc_in_frame->data[0] = enc_in->data;
+	v->enc_in_frame->data[1] = v->enc_in_frame->data[0] + size;
+	v->enc_in_frame->data[2] = v->enc_in_frame->data[1] + size/4;
+	v->enc_in_frame->linesize[0] = enc_in->w;
+	v->enc_in_frame->linesize[1] = enc_in->w/2;
+	v->enc_in_frame->linesize[2] = enc_in->w/2;
+
+	/* now setup the parameters for the encoder.
+	 * XXX should be codec-specific
+	 */
+	enc_ctx = avcodec_alloc_context();
+	if (!enc_ctx) {
+		/* previously dereferenced unchecked */
+		ast_log(LOG_WARNING, "Unable to allocate the encoder context\n");
+		return video_out_uninit(env);
+	}
+	v->enc_ctx = enc_ctx;
+	enc_ctx->pix_fmt = enc_in->pix_fmt;
+	enc_ctx->width = enc_in->w;
+	enc_ctx->height = enc_in->h;
+	/* XXX rtp_callback ?
+	 * rtp_mode so ffmpeg inserts as many start codes as possible.
+	 */
+	enc_ctx->rtp_mode = 1;
+	enc_ctx->rtp_payload_size = v->mtu / 2; // mtu/2
+	enc_ctx->bit_rate = v->bitrate;
+	enc_ctx->bit_rate_tolerance = enc_ctx->bit_rate/2;
+	enc_ctx->qmin = v->qmin;	/* should be configured */
+	enc_ctx->time_base = (AVRational){1, v->fps};
+	enc_ctx->gop_size = v->fps*5;	// emit I frame every 5 seconds
+
+	v->enc->enc_init(v->enc_ctx);
+
+	if (avcodec_open(enc_ctx, v->codec) < 0) {
+		ast_log(LOG_WARNING, "Unable to initialize the encoder %d\n",
+			codec);
+		/* the context was never opened, so free it here and hide it
+		 * from video_out_uninit(), which would call avcodec_close() */
+		av_free(enc_ctx);
+		v->enc_ctx = NULL;
+		return video_out_uninit(env);
+	}
+
+	/*
+	 * Allocate enough for the encoded bitstream. As we are compressing,
+	 * we hope that the output is never larger than the input size.
+	 */
+	v->enc_out.data = ast_calloc(1, enc_in->size);
+	if (!v->enc_out.data) {
+		/* previously reported success with a NULL output buffer */
+		ast_log(LOG_WARNING, "Cannot allocate encoder output buffer\n");
+		return video_out_uninit(env);
+	}
+	v->enc_out.size = enc_in->size;
+	v->enc_out.used = 0;
+
+	return 0;
+}
+
+/*! \brief possibly uninitialize the video console.
+ * Called at the end of a call, should reset the 'owner' field,
+ * then possibly terminate the video thread if the gui has
+ * not been started manually.
+ * In practice, signal the thread and give it a bit of time to
+ * complete, giving up if it gets stuck. Because uninit
+ * is called from hangup with the channel locked, and the thread
+ * uses the chan lock, we need to unlock here. This is unsafe,
+ * and we should really use refcounts for the channels.
+ *
+ * The wait is bounded: at most 10 rounds, the first sleeping 100
+ * microseconds and the following ones 1 second each. The loop ends
+ * early as soon as the video thread clears env->shutdown.
+ */
+void console_video_uninit(struct video_desc *env)
+{
+ int i, t = 100; /* initial wait is shorter, then make it longer */
+ if (env->stayopen == 0) { /* in a call */
+ env->shutdown = 1;
+ for (i=0; env->shutdown && i < 10; i++) {
+ /* drop the channel lock while sleeping so the video thread can take it */
+ if (env->owner)
+ ast_channel_unlock(env->owner);
+ usleep(t);
+ t = 1000000;
+ if (env->owner)
+ ast_channel_lock(env->owner);
+ }
+ }
+ env->owner = NULL; /* this is unconditional */
+}
+
+/*! Describe an fbuf_t as an AVPicture, as needed by the ffmpeg image
+ * conversion routines.
+ *
+ * The picture is zeroed first. For the packed formats handled below
+ * (RGB555, RGB565, YUYV422 at 2 bytes per pixel, RGBA32 at 4) the
+ * first plane linesize is w times the pixel size and the chroma
+ * linesizes are 0. Any other format is laid out as a Y plane of
+ * linesize w followed by two chroma planes of linesize w/2.
+ * XXX This depends on the format.
+ * \return p, for convenience.
+ */
+static AVPicture *fill_pict(struct fbuf_t *b, AVPicture *p)
+{
+	int plane_uv = b->w * b->h/4;	/* size of U or V frame */
+	int y_stride = b->w;		/* Y linesize, bytes */
+	int uv_stride = b->w/2;		/* U/V linesize, bytes */
+	int packed_bpp = 0;		/* bytes per pixel if packed, else 0 */
+
+	bzero(p, sizeof(*p));
+	switch (b->pix_fmt) {
+	case PIX_FMT_RGB555:
+	case PIX_FMT_RGB565:
+	case PIX_FMT_YUYV422:	/* Packed YUV 4:2:2, 16bpp, Y0 Cb Y1 Cr */
+		packed_bpp = 2;
+		break;
+	case PIX_FMT_RGBA32:
+		packed_bpp = 4;
+		break;
+	}
+	if (packed_bpp) {
+		/* all data lives in the first plane */
+		y_stride *= packed_bpp;
+		uv_stride = 0;
+	}
+
+	p->data[0] = b->data;
+	p->linesize[0] = y_stride;
+	/* the remaining planes are only meaningful for component images */
+	if (uv_stride) {
+		p->data[1] = b->data + 4*plane_uv;
+		p->data[2] = b->data + 5*plane_uv;
+	} else {
+		p->data[1] = b->data + y_stride;
+		p->data[2] = b->data + y_stride;
+	}
+	p->linesize[1] = uv_stride;
+	p->linesize[2] = uv_stride;
+	return p;
+}
+
+/*! convert/scale between an input and an output format.
+ * Old version of ffmpeg only have img_convert, which does not rescale.
+ * New versions use sws_scale which does both.
+ *
+ * \param in    geometry and pixel format of the source
+ * \param p_in  source picture, or NULL to derive it from 'in' with fill_pict()
+ * \param out   geometry and pixel format of the destination
+ * \param p_out destination picture, or NULL to derive it from 'out'
+ *
+ * On a swscale context failure an error is logged and the destination
+ * is left untouched.
+ */
+static void my_scale(struct fbuf_t *in, AVPicture *p_in,
+	struct fbuf_t *out, AVPicture *p_out)
+{
+	AVPicture my_p_in, my_p_out;
+
+	if (p_in == NULL)
+		p_in = fill_pict(in, &my_p_in);
+	if (p_out == NULL)
+		p_out = fill_pict(out, &my_p_out);
+
+#ifdef OLD_FFMPEG
+	/* XXX img_convert is deprecated, and does not do rescaling */
+	img_convert(p_out, out->pix_fmt,
+		p_in, in->pix_fmt, in->w, in->h);
+#else /* XXX replacement */
+	{
+		struct SwsContext *convert_ctx;
+
+		convert_ctx = sws_getContext(in->w, in->h, in->pix_fmt,
+			out->w, out->h, out->pix_fmt,
+			SWS_BICUBIC, NULL, NULL, NULL);
+		if (convert_ctx == NULL) {
+			ast_log(LOG_ERROR, "FFMPEG::convert_cmodel : swscale context initialization failed\n");
+			return;
+		}
+		/* The slice is the whole source image: it starts at row 0
+		 * and is in->h rows tall. (The start row used to be passed
+		 * as in->w, which is not a row index.)
+		 */
+		sws_scale(convert_ctx,
+			p_in->data, p_in->linesize,
+			0, in->h,	/* src slice: first row, height */
+			p_out->data, p_out->linesize);
+
+		sws_freeContext(convert_ctx);
+	}
+#endif /* XXX replacement */
+}
+
+struct video_desc *get_video_desc(struct ast_channel *c);
+
+/*
+ * This function is called (by asterisk) for each video packet
+ * coming from the network (the 'in' path) that needs to be processed.
+ * We need to reconstruct the entire video frame before we can decode it.
+ * After a video packet is received we have to:
+ * - extract the bitstream with the decoder's dec_decap() callback
+ * - append the bitstream to a buffer
+ * - if the fragment is the last (RTP Marker) hand the buffer over to the
+ *   video thread, which decodes and displays it
+ *
+ * Always returns 0: every problem (no descriptor, no gui, no decoder,
+ * lost or out-of-order packets) only causes the packet to be dropped.
+ */
+int console_write_video(struct ast_channel *chan, struct ast_frame *f);
+int console_write_video(struct ast_channel *chan, struct ast_frame *f)
+{
+	struct video_desc *env = get_video_desc(chan);
+	struct video_dec_desc *v;
+
+	if (env == NULL)	/* video not configured on this channel */
+		return 0;
+	v = env->in;
+	if (!env->gui)	/* no gui, no rendering */
+		return 0;
+	if (v == NULL)	/* first packet: create the decoder; the low bit is the RTP marker */
+		env->in = v = dec_init(f->subclass & ~1);
+	if (v == NULL) {
+		/* This is not fatal, but we won't have incoming video */
+		ast_log(LOG_WARNING, "Cannot initialize input decoder\n");
+		return 0;
+	}
+
+	if (v->dec_in_cur == NULL)	/* no buffer for incoming frames, drop */
+		return 0;
+#if defined(DROP_PACKETS) && DROP_PACKETS > 0
+	/* Simulate lost packets */
+	if ((random() % 10000) <= 100*DROP_PACKETS) {
+		ast_log(LOG_NOTICE, "Packet lost [%d]\n", f->seqno);
+		return 0;
+	}
+#endif
+	if (v->discard) {
+		/*
+		 * In discard mode, drop packets until we find one with
+		 * the RTP marker set (which is the end of frame).
+		 * Note that the RTP marker flag is sent as the LSB of the
+		 * subclass, which is a bitmask of formats. The low bit is
+		 * normally used for audio so there is no interference.
+		 */
+		if (f->subclass & 0x01) {
+			v->dec_in_cur->used = 0;
+			v->dec_in_cur->ebit = 0;
+			v->next_seq = f->seqno + 1;	/* wrap at 16 bit */
+			v->discard = 0;
+			ast_log(LOG_WARNING, "out of discard mode, frame %d\n", f->seqno);
+		}
+		return 0;
+	}
+
+	/*
+	 * Only in-order fragments will be accepted. Remember seqno
+	 * has 16 bit so there is wraparound. Also, ideally we could
+	 * accept a bit of reordering, but at the moment we don't.
+	 */
+	if (v->next_seq != f->seqno) {
+		ast_log(LOG_WARNING, "discarding frame out of order, %d %d\n",
+			v->next_seq, f->seqno);
+		v->discard = 1;
+		return 0;
+	}
+	v->next_seq++;
+
+	if (f->data == NULL || f->datalen < 2) {
+		ast_log(LOG_WARNING, "empty video frame, discard\n");
+		return 0;
+	}
+	if (v->d_callbacks->dec_decap(v->dec_in_cur, f->data, f->datalen)) {
+		ast_log(LOG_WARNING, "error in dec_decap, enter discard\n");
+		v->discard = 1;
+		/* NOTE(review): the marker handling below still runs after a
+		 * decap error, as in the original code - confirm it is intended. */
+	}
+	if (f->subclass & 0x01) {	// RTP Marker
+		/* prepare to decode: advance the buffer so the video thread knows. */
+		struct fbuf_t *tmp = v->dec_in_cur;	/* store current pointer */
+		ast_mutex_lock(&env->dec_lock);
+		if (++v->dec_in_cur == &v->dec_in[N_DEC_IN])	/* advance to next, circular */
+			v->dec_in_cur = &v->dec_in[0];
+		if (v->dec_in_dpy == NULL) {	/* were not displaying anything, so set it */
+			v->dec_in_dpy = tmp;
+		} else if (v->dec_in_dpy == v->dec_in_cur) {	/* current slot is busy */
+			v->dec_in_cur = NULL;
+		}
+		ast_mutex_unlock(&env->dec_lock);
+	}
+	return 0;
+}
+
+
+/*! \brief Grab one frame from the local source, show it, then encode and
+ * fragment it.
+ *
+ * The frame obtained through grabber_read() is scaled into env->enc_in
+ * and displayed in the local window. When sendvideo is enabled and an
+ * encoder output buffer exists, the frame is encoded and split by the
+ * codec's enc_run()/enc_encap() callbacks.
+ *
+ * \param tail if not NULL, receives the last frame of the returned list
+ *        (it is set to NULL as soon as a source frame is available).
+ * \return the head of the list of ast_frame fragments, or NULL when no
+ *         source frame is due, sending is off, or there is no output buffer.
+ */
+static struct ast_frame *get_video_frames(struct video_desc *env, struct ast_frame **tail)
+{
+	struct video_out_desc *out = &env->out;
+	struct ast_frame *unused_tail;
+	struct fbuf_t *captured = grabber_read(out);
+
+	if (captured == NULL)
+		return NULL;	/* can happen, e.g. we are reading too early */
+
+	if (tail == NULL)
+		tail = &unused_tail;	/* caller does not care about the tail */
+	*tail = NULL;
+
+	/* Scale for the encoder first and render that same image locally,
+	 * so we see what the remote party will see.
+	 */
+	my_scale(captured, NULL, &env->enc_in, NULL);
+	show_frame(env, WIN_LOCAL);
+	if (!out->sendvideo)
+		return NULL;
+
+	if (out->enc_out.data != NULL) {
+		out->enc->enc_run(out);
+		return out->enc->enc_encap(&out->enc_out, out->mtu, tail);
+	}
+
+	{
+		/* complain only the first couple of times */
+		static volatile int warned = 0;
+		if (warned++ < 2)
+			ast_log(LOG_WARNING, "fail, no encoder output buffer\n");
+	}
+	return NULL;
+}
+
+/*
+ * Helper thread to periodically poll the video source and enqueue the
+ * generated frames to the channel's queue.
+ * Using a separate thread also helps because the encoding can be
+ * computationally expensive so we don't want to starve the main thread.
+ *
+ * The thread sets up SDL, opens the grabber and the encoder, then loops
+ * roughly 20 times per second: it handles GUI events, decodes and shows
+ * any complete incoming frame, and grabs/encodes/queues local frames.
+ * It leaves the loop when env->shutdown is set, releases everything it
+ * created and finally clears env->shutdown to tell the waiter it is done.
+ *
+ * arg is the struct video_desc to operate on; the return value is
+ * always NULL.
+ */
+static void *video_thread(void *arg)
+{
+	struct video_desc *env = arg;
+	int count = 0;
+	char save_display[128] = "";
+
+	/* if sdl_videodriver is set, override the environment. Also,
+	 * if it contains 'console' override DISPLAY around the call to SDL_Init
+	 * so we use the console as opposed to the x11 version of aalib
+	 */
+	if (!ast_strlen_zero(env->sdl_videodriver)) { /* override */
+		const char *s = getenv("DISPLAY");
+		setenv("SDL_VIDEODRIVER", env->sdl_videodriver, 1);
+		if (s && !strcasecmp(env->sdl_videodriver, "aalib-console")) {
+			ast_copy_string(save_display, s, sizeof(save_display));
+			unsetenv("DISPLAY");
+		}
+	}
+	sdl_setup(env);
+	if (!ast_strlen_zero(save_display))
+		setenv("DISPLAY", save_display, 1);
+
+	/* initialize grab coordinates */
+	env->out.loc_src_geometry.x = 0;
+	env->out.loc_src_geometry.y = 0;
+
+	ast_mutex_init(&env->dec_lock);	/* used to sync decoder and renderer */
+
+	if (grabber_open(&env->out)) {
+		ast_log(LOG_WARNING, "cannot open local video source\n");
+	} else {
+		/* In principle we could register the source fd with the
+		 * channel; in practice many webcam drivers do not support
+		 * select/poll, so we just read periodically from this thread.
+		 */
+		video_out_init(env);
+	}
+
+	for (;;) {
+		struct timeval t = { 0, 50000 };	/* XXX 20 times/sec */
+		struct ast_frame *p, *f;
+		struct ast_channel *chan;
+		int fd;
+		char *caption = NULL, buf[160];
+
+		/* refresh the window caption every 10 rounds */
+		if (count++ % 10 == 0) {
+			/* bounded writes: the two names alone can take 126 bytes */
+			if (env->out.sendvideo)
+				snprintf(buf, sizeof(buf), "%s %s %dx%d @@ %dfps %dkbps",
+					env->out.videodevice, env->codec_name,
+					env->enc_in.w, env->enc_in.h,
+					env->out.fps, env->out.bitrate/1000);
+			else
+				ast_copy_string(buf, "hold", sizeof(buf));
+			caption = buf;
+		}
+
+		/* manage keypad events */
+		/* XXX here we should always check for events,
+		 * otherwise the drag will not work */
+		if (env->gui)
+			eventhandler(env, caption);
+
+		/* sleep for a while */
+		ast_select(0, NULL, NULL, NULL, &t);
+
+		if (env->in) {
+			struct video_dec_desc *v = env->in;
+
+			/*
+			 * While there is something to display, call the decoder and free
+			 * the buffer, possibly enabling the receiver to store new data.
+			 */
+			while (v->dec_in_dpy) {
+				struct fbuf_t *tmp = v->dec_in_dpy;	/* store current pointer */
+
+				if (v->d_callbacks->dec_run(v, tmp))
+					show_frame(env, WIN_REMOTE);
+				tmp->used = 0;	/* mark buffer as free */
+				tmp->ebit = 0;
+				ast_mutex_lock(&env->dec_lock);
+				if (++v->dec_in_dpy == &v->dec_in[N_DEC_IN])	/* advance to next, circular */
+					v->dec_in_dpy = &v->dec_in[0];
+
+				if (v->dec_in_cur == NULL)	/* receiver was idle, enable it... */
+					v->dec_in_cur = tmp;	/* using the slot just freed */
+				else if (v->dec_in_dpy == v->dec_in_cur) /* this was the last slot */
+					v->dec_in_dpy = NULL;	/* nothing more to display */
+				ast_mutex_unlock(&env->dec_lock);
+			}
+		}
+
+		if (env->shutdown)
+			break;
+		f = get_video_frames(env, &p);	/* read and display */
+		if (!f)
+			continue;
+		chan = env->owner;
+		if (chan == NULL) {
+			/* Nobody to deliver to: release the chain instead of
+			 * dropping the pointers. Each frame is unlinked first so
+			 * the loop is correct whether ast_frfree() releases one
+			 * frame or a whole list.
+			 */
+			while (f) {
+				struct ast_frame *next = AST_LIST_NEXT(f, frame_list);
+
+				f->frame_list.next = NULL;
+				ast_frfree(f);
+				f = next;
+			}
+			continue;
+		}
+		fd = chan->alertpipe[1];
+		ast_channel_lock(chan);
+
+		/* AST_LIST_INSERT_TAIL is only good for one frame, cannot use here */
+		if (chan->readq.first == NULL) {
+			chan->readq.first = f;
+		} else {
+			chan->readq.last->frame_list.next = f;
+		}
+		chan->readq.last = p;
+		/*
+		 * more or less same as ast_queue_frame, but extra
+		 * write on the alertpipe to signal frames.
+		 */
+		if (fd > -1) {
+			int blah = 1, l = sizeof(blah);
+			/* one wakeup per queued fragment */
+			for (p = f; p; p = AST_LIST_NEXT(p, frame_list)) {
+				if (write(fd, &blah, l) != l)
+					ast_log(LOG_WARNING, "Unable to write to alert pipe on %s, frametype/subclass %d/%d: %s!\n",
+						chan->name, f->frametype, f->subclass, strerror(errno));
+			}
+		}
+		ast_channel_unlock(chan);
+	}
+	/* thread terminating, here could call the uninit */
+	/* uninitialize the local and remote video environments */
+	env->in = dec_uninit(env->in);
+	video_out_uninit(env);
+
+	if (env->gui)
+		env->gui = cleanup_sdl(env->gui);
+	ast_mutex_destroy(&env->dec_lock);
+	env->shutdown = 0;	/* tells console_video_uninit() we are done */
+	return NULL;
+}
+
+/* Fill in the width and/or height of dst from src, but only for the
+ * dimensions that are still unset (zero) in dst.
+ */
+static void copy_geometry(struct fbuf_t *src, struct fbuf_t *dst)
+{
+	dst->w = dst->w ? dst->w : src->w;
+	dst->h = dst->h ? dst->h : src->h;
+}
+
+/*! Set default pixel formats and geometries in the video environment.
+ *
+ * All four descriptors (camera, encoder input, local and remote display)
+ * use PIX_FMT_YUV420P. The encoder input defaults to 352x288 when either
+ * of its dimensions is unset; the other geometries then inherit any
+ * dimension they are missing, with enc_in as the base.
+ */
+static void init_env(struct video_desc *env)
+{
+	struct fbuf_t *enc_in = &env->enc_in;			/* encoder input */
+	struct fbuf_t *camera = &env->out.loc_src_geometry;	/* local source */
+	struct fbuf_t *remote = &env->rem_dpy;			/* remote display */
+	struct fbuf_t *local = &env->loc_dpy;			/* local display */
+
+	camera->pix_fmt = PIX_FMT_YUV420P;	/* default - camera format */
+	enc_in->pix_fmt = PIX_FMT_YUV420P;
+	remote->pix_fmt = PIX_FMT_YUV420P;	/* sdl format */
+	local->pix_fmt = PIX_FMT_YUV420P;	/* sdl format */
+
+	if (!enc_in->w || !enc_in->h) {
+		enc_in->w = 352;
+		enc_in->h = 288;
+	}
+
+	/* inheritance chain: enc_in -> camera, enc_in -> remote -> local */
+	copy_geometry(enc_in, camera);
+	copy_geometry(enc_in, remote);
+	copy_geometry(remote, local);
+}
+
+/*!
+ * The first call to the video code, called by oss_new() or similar.
+ * Here we initialize the various components we use, namely SDL for display,
+ * ffmpeg for encoding/decoding, and a local video source.
+ * We do our best to progress even if some of the components are not
+ * available.
+ *
+ * \param env   the video descriptor; NULL means video is not configured
+ *              and the call is a no-op.
+ * \param owner the channel that will receive the frames, or NULL when
+ *              the gui is started manually. In the latter case 'stayopen'
+ *              is set so the thread is not stopped on hangup.
+ *
+ * If the video thread cannot be created an error is logged and
+ * 'stayopen' is left untouched.
+ */
+void console_video_start(struct video_desc *env, struct ast_channel *owner)
+{
+	ast_log(LOG_WARNING, "env %p chan %p\n", env, owner);
+	if (env == NULL)	/* video not initialized */
+		return;
+	env->owner = owner;	/* work even if no owner is specified */
+	if (env->stayopen)
+		return;	/* already initialized, nothing to do */
+	init_env(env);
+	env->out.enc = map_config_video_format(env->codec_name);
+
+	ast_log(LOG_WARNING, "start video out %s %dx%d\n",
+		env->codec_name, env->enc_in.w, env->enc_in.h);
+	/*
+	 * Register all codecs supported by the ffmpeg library.
+	 * We only need to do it once, but probably doesn't
+	 * harm to do it multiple times.
+	 */
+	avcodec_init();
+	avcodec_register_all();
+	av_log_set_level(AV_LOG_ERROR);	/* only report errors */
+
+	if (env->out.fps == 0) {
+		env->out.fps = 15;
+		ast_log(LOG_WARNING, "fps unset, forcing to %d\n", env->out.fps);
+	}
+	if (env->out.bitrate == 0) {
+		env->out.bitrate = 65000;
+		ast_log(LOG_WARNING, "bitrate unset, forcing to %d\n", env->out.bitrate);
+	}
+	if (ast_pthread_create_background(&env->vthread, NULL, video_thread, env)) {
+		/* without a thread there is nothing to keep open */
+		ast_log(LOG_ERROR, "unable to start the video thread\n");
+		return;
+	}
+	if (env->owner == NULL)
+		env->stayopen = 1;	/* manually opened so don't close on hangup */
+}
+
+/*
+ * Parse a geometry string, accepting also common names for the formats.
+ * Trick: if we have a leading > or < and a numeric geometry,
+ * return the larger or smaller one.
+ * E.g. <352x288 gives the smaller one, 320x240
+ *
+ * Accepted forms for 's':
+ *   - a format name from the table below (case-insensitive), e.g. "cif";
+ *   - "<WxH" or ">WxH": the nearest table entry narrower / wider than W,
+ *     clamped to the smallest / largest entry when none qualifies;
+ *   - "WxH" with both values positive.
+ * Anything else logs a warning and selects 352x288.
+ * The result is stored in b->w and b->h; the return value is always 0.
+ */
+static int video_geom(struct fbuf_t *b, const char *s)
+{
+	int w = 0, h = 0;
+	/* sorted from the largest to the smallest width */
+	static const struct geom_name {
+		const char *s; int w; int h;
+	} formats[] = {
+		{"16cif",	1408, 1152 },
+		{"xga",		1024, 768 },
+		{"4cif",	704, 576 },
+		{"vga",		640, 480 },
+		{"cif",		352, 288 },
+		{"qvga",	320, 240 },
+		{"qcif",	176, 144 },
+		{"sqcif",	128, 96 },
+		{NULL,		0, 0 },
+	};
+	const struct geom_name *fp;	/* was function-static for no reason */
+	const int relative = (*s == '<' || *s == '>');
+
+	/* a relative request needs a valid numeric geometry to compare with */
+	if (relative && (sscanf(s+1, "%dx%d", &w, &h) != 2 || w <= 0 || h <= 0))
+		goto invalid;
+
+	for (fp = formats; fp->s; fp++) {
+		if (*s == '>') {	/* look for a larger one */
+			if (fp->w <= w) {
+				if (fp > formats)
+					fp--;	/* back one step if possible */
+				break;
+			}
+		} else if (*s == '<') {	/* look for a smaller one */
+			if (fp->w < w)
+				break;
+		} else if (!strcasecmp(s, fp->s)) {	/* look for a string */
+			break;
+		}
+	}
+	/* Relative request beyond the small end of the table: use the
+	 * smallest entry. For '>' this is still larger than requested.
+	 */
+	if (relative && fp->s == NULL)
+		fp--;
+	if (fp->s) {
+		b->w = fp->w;
+		b->h = fp->h;
+		return 0;
+	}
+	/* not a known name: try an explicit, positive WxH */
+	if (sscanf(s, "%dx%d", &w, &h) == 2 && w > 0 && h > 0) {
+		b->w = w;
+		b->h = h;
+		return 0;
+	}
+invalid:
+	ast_log(LOG_WARNING, "Invalid video_size %s, using 352x288\n", s);
+	b->w = 352;
+	b->h = 288;
+	return 0;
+}
+
+/* Video extensions to the console CLI. Called by console_video_config.
+ *
+ * 'var' selects a value to print on the CLI descriptor 'fd' (videodevice,
+ * videocodec, sendvideo, video_size, bitrate, qmin, fps) or an action
+ * (startgui, stopgui). Matching is case-insensitive.
+ * Returns 0 if 'var' was recognised, 1 otherwise. "stopgui" only counts
+ * as recognised while the gui is marked as manually opened (stayopen).
+ */
+int console_video_cli(struct video_desc *env, const char *var, int fd)
+{
+	if (!env)
+		return 1;	/* unrecognised */
+
+	if (strcasecmp(var, "videodevice") == 0) {
+		ast_cli(fd, "videodevice is [%s]\n", env->out.videodevice);
+		return 0;
+	}
+	if (strcasecmp(var, "videocodec") == 0) {
+		ast_cli(fd, "videocodec is [%s]\n", env->codec_name);
+		return 0;
+	}
+	if (strcasecmp(var, "sendvideo") == 0) {
+		ast_cli(fd, "sendvideo is [%s]\n", env->out.sendvideo ? "on" : "off");
+		return 0;
+	}
+	if (strcasecmp(var, "video_size") == 0) {
+		/* size of the decoded remote stream, 0x0 until a decoder exists */
+		int dec_w = env->in ? env->in->dec_out.w : 0;
+		int dec_h = env->in ? env->in->dec_out.h : 0;
+
+		ast_cli(fd, "sizes: video %dx%d camera %dx%d local %dx%d remote %dx%d in %dx%d\n",
+			env->enc_in.w, env->enc_in.h,
+			env->out.loc_src_geometry.w, env->out.loc_src_geometry.h,
+			env->loc_dpy.w, env->loc_dpy.h,
+			env->rem_dpy.w, env->rem_dpy.h,
+			dec_w, dec_h);
+		return 0;
+	}
+	if (strcasecmp(var, "bitrate") == 0) {
+		ast_cli(fd, "bitrate is [%d]\n", env->out.bitrate);
+		return 0;
+	}
+	if (strcasecmp(var, "qmin") == 0) {
+		ast_cli(fd, "qmin is [%d]\n", env->out.qmin);
+		return 0;
+	}
+	if (strcasecmp(var, "fps") == 0) {
+		ast_cli(fd, "fps is [%d]\n", env->out.fps);
+		return 0;
+	}
+	if (strcasecmp(var, "startgui") == 0) {
+		console_video_start(env, NULL);
+		return 0;
+	}
+	if (strcasecmp(var, "stopgui") == 0 && env->stayopen != 0) {
+		env->stayopen = 0;
+		if (env->gui && env->owner)
+			ast_cli_command(-1, "console hangup");
+		else	/* not in a call */
+			console_video_uninit(env);
+		return 0;
+	}
+	return 1;	/* unrecognised */
+}
+
+/*! parse config command for video support.
+ *
+ * \param penv address of the caller's video descriptor pointer. The
+ *        descriptor is allocated (zeroed, then given defaults) the first
+ *        time this function is called with *penv == NULL.
+ * \param var  option name
+ * \param val  option value
+ * \return 0 if the option was handled, 1 on error (NULL penv, allocation
+ *         failure) or when no option matched.
+ *
+ * NOTE(review): the CV_* macros are defined outside this file; the
+ * control flow between CV_START and CV_END is presumably "first matching
+ * entry jumps past CV_END" - confirm against their definition.
+ */
+int console_video_config(struct video_desc **penv,
+ const char *var, const char *val)
+{
+ struct video_desc *env;
+
+ if (penv == NULL) {
+ ast_log(LOG_WARNING, "bad argument penv=NULL\n");
+ return 1; /* error */
+ }
+ /* allocate the video descriptor first time we get here */
+ env = *penv;
+ if (env == NULL) {
+ env = *penv = ast_calloc(1, sizeof(struct video_desc));
+ if (env == NULL) {
+ ast_log(LOG_WARNING, "fail to allocate video_desc\n");
+ return 1; /* error */
+
+ }
+ /* set default values */
+ ast_copy_string(env->out.videodevice, "X11", sizeof(env->out.videodevice));
+ env->out.fps = 5;
+ env->out.bitrate = 65000;
+ env->out.sendvideo = 1;
+ env->out.qmin = 3;
+ }
+ CV_START(var, val);
+ CV_STR("videodevice", env->out.videodevice);
+ CV_BOOL("sendvideo", env->out.sendvideo);
+ CV_F("video_size", video_geom(&env->enc_in, val));
+ CV_F("camera_size", video_geom(&env->out.loc_src_geometry, val));
+ CV_F("local_size", video_geom(&env->loc_dpy, val));
+ CV_F("remote_size", video_geom(&env->rem_dpy, val));
+ CV_STR("keypad", env->keypad_file);
+ /* NOTE(review): env->gui is still NULL on a freshly allocated descriptor; verify keypad_cfg_read() accepts that */
+ CV_F("region", keypad_cfg_read(env->gui, val));
+ CV_STR("keypad_font", env->keypad_font);
+ CV_STR("sdl_videodriver", env->sdl_videodriver);
+ CV_UINT("fps", env->out.fps);
+ CV_UINT("bitrate", env->out.bitrate);
+ CV_UINT("qmin", env->out.qmin);
+ CV_STR("videocodec", env->codec_name);
+ return 1; /* nothing found */
+
+ CV_END; /* the 'nothing found' case */
+ return 0; /* found something */
+}
+
+#endif /* video support */