msvideo1enc.c
Go to the documentation of this file.
1 /*
2  * Microsoft Video-1 Encoder
3  * Copyright (c) 2009 Konstantin Shishkov
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 /**
23  * @file
24  * Microsoft Video-1 encoder
25  */
26 
27 #include "avcodec.h"
28 #include "internal.h"
29 #include "bytestream.h"
30 #include "libavutil/lfg.h"
31 #include "elbg.h"
32 #include "libavutil/imgutils.h"
33 /**
34  * Encoder context
35  */
36 typedef struct Msvideo1EncContext {
41 
42  int block[16*3];
43  int block2[16*3];
44  int codebook[8*3];
45  int codebook2[8*3];
46  int output[16*3];
47  int output2[16*3];
48  int avg[3];
49  int bestpos;
50  int keyint;
52 
/** Coding modes the encoder chooses between for every 4x4 block. */
enum MSV1Mode{
    MODE_SKIP = 0, ///< keep the block from the previous frame
    MODE_FILL,     ///< one colour for the whole 4x4 block
    MODE_2COL,     ///< two colours for the whole 4x4 block
    MODE_8COL,     ///< two colours for each of the four 2x2 quadrants
};
59 
/** Upper bits of the 16-bit code word that announces a run of skipped blocks. */
#define SKIP_PREFIX 0x8400
/**
 * Longest run that fits in one skip code. The run length is OR-ed into
 * SKIP_PREFIX, so it must stay inside the 10 bits below the prefix;
 * anything larger would overwrite the prefix bits themselves.
 */
#define SKIPS_MAX 0x03FF
/** Pack three consecutive 5-bit components starting at in[off] into one 15-bit value. */
#define MKRGB555(in, off) (((in)[(off)] << 10) | ((in)[(off) + 1] << 5) | ((in)[(off) + 2]))

/**
 * Maps a raster position inside a 4x4 block (i + j*4) to its slot in block2,
 * where the four pixels of every 2x2 quadrant are stored next to each other.
 */
static const int remap[16] = { 0, 1, 4, 5, 2, 3, 6, 7, 8, 9, 12, 13, 10, 11, 14, 15 };
65 
67  const AVFrame *pict, int *got_packet)
68 {
69  Msvideo1EncContext * const c = avctx->priv_data;
70  AVFrame * const p = &c->pic;
71  uint16_t *src;
72  uint8_t *prevptr;
73  uint8_t *dst, *buf;
74  int keyframe = 0;
75  int no_skips = 1;
76  int i, j, k, x, y, ret;
77  int skips = 0;
78 
79  if ((ret = ff_alloc_packet2(avctx, pkt, avctx->width*avctx->height*9 + FF_MIN_BUFFER_SIZE)) < 0)
80  return ret;
81  dst= buf= pkt->data;
82 
83  *p = *pict;
84  if(!c->prev)
85  c->prev = av_malloc(avctx->width * 3 * (avctx->height + 3));
86  prevptr = c->prev + avctx->width * 3 * (FFALIGN(avctx->height, 4) - 1);
87  src = (uint16_t*)(p->data[0] + p->linesize[0]*(FFALIGN(avctx->height, 4) - 1));
88  if(c->keyint >= avctx->keyint_min)
89  keyframe = 1;
90 
91  p->quality = 24;
92 
93  for(y = 0; y < avctx->height; y += 4){
94  for(x = 0; x < avctx->width; x += 4){
95  int bestmode = MODE_SKIP;
96  int bestscore = INT_MAX;
97  int flags = 0;
98  int score;
99 
100  for(j = 0; j < 4; j++){
101  for(i = 0; i < 4; i++){
102  uint16_t val = src[x + i - j*p->linesize[0]/2];
103  for(k = 0; k < 3; k++){
104  c->block[(i + j*4)*3 + k] =
105  c->block2[remap[i + j*4]*3 + k] = (val >> (10-k*5)) & 0x1F;
106  }
107  }
108  }
109  if(!keyframe){
110  bestscore = 0;
111  for(j = 0; j < 4; j++){
112  for(i = 0; i < 4*3; i++){
113  int t = prevptr[x*3 + i - j*3*avctx->width] - c->block[i + j*4*3];
114  bestscore += t*t;
115  }
116  }
117  bestscore /= p->quality;
118  }
119  // try to find optimal value to fill whole 4x4 block
120  score = 0;
121  ff_init_elbg(c->block, 3, 16, c->avg, 1, 1, c->output, &c->rnd);
122  ff_do_elbg (c->block, 3, 16, c->avg, 1, 1, c->output, &c->rnd);
123  if(c->avg[0] == 1) // red component = 1 will be written as skip code
124  c->avg[0] = 0;
125  for(j = 0; j < 4; j++){
126  for(i = 0; i < 4; i++){
127  for(k = 0; k < 3; k++){
128  int t = c->avg[k] - c->block[(i+j*4)*3+k];
129  score += t*t;
130  }
131  }
132  }
133  score /= p->quality;
134  score += 2;
135  if(score < bestscore){
136  bestscore = score;
137  bestmode = MODE_FILL;
138  }
139  // search for optimal filling of 2-color block
140  score = 0;
141  ff_init_elbg(c->block, 3, 16, c->codebook, 2, 1, c->output, &c->rnd);
142  ff_do_elbg (c->block, 3, 16, c->codebook, 2, 1, c->output, &c->rnd);
143  // last output value should be always 1, swap codebooks if needed
144  if(!c->output[15]){
145  for(i = 0; i < 3; i++)
146  FFSWAP(uint8_t, c->codebook[i], c->codebook[i+3]);
147  for(i = 0; i < 16; i++)
148  c->output[i] ^= 1;
149  }
150  for(j = 0; j < 4; j++){
151  for(i = 0; i < 4; i++){
152  for(k = 0; k < 3; k++){
153  int t = c->codebook[c->output[i+j*4]*3 + k] - c->block[i*3+k+j*4*3];
154  score += t*t;
155  }
156  }
157  }
158  score /= p->quality;
159  score += 6;
160  if(score < bestscore){
161  bestscore = score;
162  bestmode = MODE_2COL;
163  }
164  // search for optimal filling of 2-color 2x2 subblocks
165  score = 0;
166  for(i = 0; i < 4; i++){
167  ff_init_elbg(c->block2 + i*4*3, 3, 4, c->codebook2 + i*2*3, 2, 1, c->output2 + i*4, &c->rnd);
168  ff_do_elbg (c->block2 + i*4*3, 3, 4, c->codebook2 + i*2*3, 2, 1, c->output2 + i*4, &c->rnd);
169  }
170  // last value should be always 1, swap codebooks if needed
171  if(!c->output2[15]){
172  for(i = 0; i < 3; i++)
173  FFSWAP(uint8_t, c->codebook2[i+18], c->codebook2[i+21]);
174  for(i = 12; i < 16; i++)
175  c->output2[i] ^= 1;
176  }
177  for(j = 0; j < 4; j++){
178  for(i = 0; i < 4; i++){
179  for(k = 0; k < 3; k++){
180  int t = c->codebook2[(c->output2[remap[i+j*4]] + (i&2) + (j&2)*2)*3+k] - c->block[i*3+k + j*4*3];
181  score += t*t;
182  }
183  }
184  }
185  score /= p->quality;
186  score += 18;
187  if(score < bestscore){
188  bestscore = score;
189  bestmode = MODE_8COL;
190  }
191 
192  if(bestmode == MODE_SKIP){
193  skips++;
194  no_skips = 0;
195  }
196  if((bestmode != MODE_SKIP && skips) || skips == SKIPS_MAX){
197  bytestream_put_le16(&dst, skips | SKIP_PREFIX);
198  skips = 0;
199  }
200 
201  switch(bestmode){
202  case MODE_FILL:
203  bytestream_put_le16(&dst, MKRGB555(c->avg,0) | 0x8000);
204  for(j = 0; j < 4; j++)
205  for(i = 0; i < 4; i++)
206  for(k = 0; k < 3; k++)
207  prevptr[x*3 + i*3 + k - j*3*avctx->width] = c->avg[k];
208  break;
209  case MODE_2COL:
210  for(j = 0; j < 4; j++){
211  for(i = 0; i < 4; i++){
212  flags |= (c->output[i + j*4]^1) << (i + j*4);
213  for(k = 0; k < 3; k++)
214  prevptr[x*3 + i*3 + k - j*3*avctx->width] = c->codebook[c->output[i + j*4]*3 + k];
215  }
216  }
217  bytestream_put_le16(&dst, flags);
218  bytestream_put_le16(&dst, MKRGB555(c->codebook, 0));
219  bytestream_put_le16(&dst, MKRGB555(c->codebook, 3));
220  break;
221  case MODE_8COL:
222  for(j = 0; j < 4; j++){
223  for(i = 0; i < 4; i++){
224  flags |= (c->output2[remap[i + j*4]]^1) << (i + j*4);
225  for(k = 0; k < 3; k++)
226  prevptr[x*3 + i*3 + k - j*3*avctx->width] = c->codebook2[(c->output2[remap[i+j*4]] + (i&2) + (j&2)*2)*3 + k];
227  }
228  }
229  bytestream_put_le16(&dst, flags);
230  bytestream_put_le16(&dst, MKRGB555(c->codebook2, 0) | 0x8000);
231  for(i = 3; i < 24; i += 3)
232  bytestream_put_le16(&dst, MKRGB555(c->codebook2, i));
233  break;
234  }
235  }
236  src -= p->linesize[0] << 1;
237  prevptr -= avctx->width * 3 * 4;
238  }
239  if(skips)
240  bytestream_put_le16(&dst, skips | SKIP_PREFIX);
241  //EOF
242  bytestream_put_byte(&dst, 0);
243  bytestream_put_byte(&dst, 0);
244 
245  if(no_skips)
246  keyframe = 1;
247  if(keyframe)
248  c->keyint = 0;
249  else
250  c->keyint++;
252  p->key_frame= keyframe;
253  if (keyframe) pkt->flags |= AV_PKT_FLAG_KEY;
254  pkt->size = dst - buf;
255  *got_packet = 1;
256 
257  return 0;
258 }
259 
260 
261 /**
262  * init encoder
263  */
265 {
266  Msvideo1EncContext * const c = avctx->priv_data;
267 
268  c->avctx = avctx;
269  if (av_image_check_size(avctx->width, avctx->height, 0, avctx) < 0) {
270  return -1;
271  }
272  if((avctx->width&3) || (avctx->height&3)){
273  av_log(avctx, AV_LOG_ERROR, "width and height must be multiplies of 4\n");
274  return -1;
275  }
276 
278  avctx->coded_frame = (AVFrame*)&c->pic;
279  avctx->bits_per_coded_sample = 16;
280 
281  c->keyint = avctx->keyint_min;
282  av_lfg_init(&c->rnd, 1);
283 
284  return 0;
285 }
286 
287 
288 
289 /**
290  * Uninit encoder
291  */
293 {
294  Msvideo1EncContext * const c = avctx->priv_data;
295 
296  av_freep(&c->prev);
297 
298  return 0;
299 }
300 
302  .name = "msvideo1",
303  .type = AVMEDIA_TYPE_VIDEO,
304  .id = AV_CODEC_ID_MSVIDEO1,
305  .priv_data_size = sizeof(Msvideo1EncContext),
306  .init = encode_init,
307  .encode2 = encode_frame,
308  .close = encode_end,
309  .pix_fmts = (const enum AVPixelFormat[]){AV_PIX_FMT_RGB555, AV_PIX_FMT_NONE},
310  .long_name = NULL_IF_CONFIG_SMALL("Microsoft Video-1"),
311 };
static av_cold int encode_init(AVCodecContext *avctx)
init encoder
Definition: msvideo1enc.c:264
Definition: lfg.h:25
This structure describes decoded (raw) audio or video data.
Definition: frame.h:76
misc image utilities
int output2[16 *3]
Definition: msvideo1enc.c:47
AVFrame * coded_frame
the picture in the bitstream
static av_cold int init(AVCodecContext *avctx)
Definition: avrndec.c:35
#define FFALIGN(x, a)
Definition: common.h:63
void av_freep(void *arg)
Free a memory block which has been allocated with av_malloc(z)() or av_realloc() and set the pointer ...
Definition: mem.c:198
uint8_t
#define av_cold
Definition: attributes.h:78
static AVPacket pkt
Definition: demuxing.c:56
struct Msvideo1EncContext Msvideo1EncContext
Encoder context.
uint8_t * data
int output[16 *3]
Definition: msvideo1enc.c:46
int bits_per_coded_sample
bits per sample/pixel from the demuxer (needed for huffyuv).
#define AV_PKT_FLAG_KEY
The packet contains a keyframe.
Discrete Time axis x
static int encode_frame(AVCodecContext *avctx, AVPacket *pkt, const AVFrame *pict, int *got_packet)
Definition: msvideo1enc.c:66
#define SKIP_PREFIX
Definition: msvideo1enc.c:60
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
void av_log(void *avcl, int level, const char *fmt,...)
Definition: log.c:246
const char * name
Name of the codec implementation.
int codebook[8 *3]
Definition: msvideo1enc.c:44
external API header
int block2[16 *3]
Definition: msvideo1enc.c:43
int flags
A combination of AV_PKT_FLAG values.
void ff_do_elbg(int *points, int dim, int numpoints, int *codebook, int numCB, int max_steps, int *closest_cb, AVLFG *rand_state)
Implementation of the Enhanced LBG Algorithm Based on the paper "Neural Networks 14:1219-1237" that c...
Definition: elbg.c:354
int av_image_check_size(unsigned int w, unsigned int h, int log_offset, void *log_ctx)
Check if the given dimension of an image is valid, meaning that all bytes of the image can be address...
Definition: imgutils.c:231
enum AVPictureType pict_type
Picture type of the frame.
Definition: frame.h:144
#define FF_MIN_BUFFER_SIZE
minimum encoding buffer size Used to avoid some checks during header writing.
ret
Definition: avfilter.c:821
int width
picture width / height.
t
Definition: genspecsines3.m:6
int quality
quality (between 1 (good) and FF_LAMBDA_MAX (bad))
Definition: frame.h:185
int ff_alloc_packet2(AVCodecContext *avctx, AVPacket *avpkt, int size)
Check AVPacket size and/or allocate data.
for k
AVS_Value src
Definition: avisynth_c.h:523
static const int remap[16]
Definition: msvideo1enc.c:64
static av_cold int encode_end(AVCodecContext *avctx)
Uninit encoder.
Definition: msvideo1enc.c:292
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
Definition: frame.h:101
int codebook2[8 *3]
Definition: msvideo1enc.c:45
main external API structure.
static void close(AVCodecParserContext *s)
Definition: h264_parser.c:375
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:148
void * buf
Definition: avisynth_c.h:594
MSV1Mode
Definition: msvideo1enc.c:53
AVCodec ff_msvideo1_encoder
Definition: msvideo1enc.c:301
void * av_malloc(size_t size)
Allocate a block of size bytes with alignment suitable for all memory accesses (including vectors if ...
Definition: mem.c:73
void avcodec_get_frame_defaults(AVFrame *frame)
Set the fields of the given AVFrame to default values.
synthesis window for stochastic i
av_cold void av_lfg_init(AVLFG *c, unsigned int seed)
Definition: lfg.c:30
#define SKIPS_MAX
Definition: msvideo1enc.c:61
void ff_init_elbg(int *points, int dim, int numpoints, int *codebook, int numCB, int max_steps, int *closest_cb, AVLFG *rand_state)
Initialize the **codebook vector for the elbg algorithm.
Definition: elbg.c:327
static int flags
Definition: cpu.c:23
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:87
int block[16 *3]
Definition: msvideo1enc.c:42
common internal api header.
static double c[64]
#define AV_PIX_FMT_RGB555
Definition: pixfmt.h:269
function y
Definition: D.m:1
AVCodecContext * avctx
Definition: msvideo1enc.c:37
Encoder context.
Definition: msvideo1enc.c:36
else dst[i][x+y *dst_stride[i]]
Definition: vf_mcdeint.c:160
int key_frame
1 -> keyframe, 0-> not
Definition: frame.h:139
#define MKRGB555(in, off)
Definition: msvideo1enc.c:62
#define FFSWAP(type, a, b)
Definition: common.h:61
AVPixelFormat
Pixel format.
Definition: pixfmt.h:66
This structure stores compressed data.
Predicted.
Definition: avutil.h:217
int keyint_min
minimum GOP size