82 #define CVID_HEADER_SIZE 10
83 #define STRIP_HEADER_SIZE 12
84 #define CHUNK_HEADER_SIZE 4
86 #define MB_SIZE 4 //4x4 MBs
87 #define MB_AREA (MB_SIZE*MB_SIZE)
89 #define VECTOR_MAX 6 //six or four entries per vector depending on format
90 #define CODEBOOK_MAX 256 //size of a codebook
92 #define MAX_STRIPS 32 //Note: having fewer choices regarding the number of strips speeds up encoding (obviously)
93 #define MIN_STRIPS 1 //Note: having more strips speeds up encoding the frame (this is less obvious)
155 #ifdef CINEPAKENC_DEBUG
157 int num_v1_mode, num_v4_mode, num_mc_mode;
158 int num_v1_encs, num_v4_encs, num_skips;
168 #define OFFSET(x) offsetof(CinepakEncContext, x)
169 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
171 {
"max_extra_cb_iterations",
"Max extra codebook recalculation passes, more is better and slower",
OFFSET(max_extra_cb_iterations),
AV_OPT_TYPE_INT, { .i64 = 2 }, 0, INT_MAX,
VE },
172 {
"skip_empty_cb",
"Avoid wasting bytes, ignore vintage MacOS decoder",
OFFSET(skip_empty_cb),
AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1,
VE },
173 {
"max_strips",
"Limit strips/frame, vintage compatible is 1..3, otherwise the more the better",
OFFSET(max_max_strips),
AV_OPT_TYPE_INT, { .i64 = 3 },
MIN_STRIPS,
MAX_STRIPS,
VE },
174 {
"min_strips",
"Enforce min strips/frame, more is worse and faster, must be <= max_strips",
OFFSET(min_min_strips),
AV_OPT_TYPE_INT, { .i64 =
MIN_STRIPS },
MIN_STRIPS,
MAX_STRIPS,
VE },
175 {
"strip_number_adaptivity",
"How fast the strip number adapts, more is slightly better, much slower",
OFFSET(strip_number_delta_range),
AV_OPT_TYPE_INT, { .i64 = 0 }, 0,
MAX_STRIPS-
MIN_STRIPS,
VE },
189 int x, mb_count, strip_buf_size, frame_buf_size;
192 av_log(avctx,
AV_LOG_ERROR,
"width and height must be multiples of four (got %ix%i)\n",
198 av_log(avctx,
AV_LOG_ERROR,
"minimal number of strips can not exceed maximal (got %i and %i)\n",
242 #ifdef CINEPAKENC_DEBUG
287 #ifdef CINEPAKENC_DEBUG
288 s->num_v1_mode = s->num_v4_mode = s->num_mc_mode = s->num_v1_encs = s->num_v4_encs = s->num_skips = 0;
304 #ifdef CINEPAKENC_DEBUG
315 #ifdef CINEPAK_REPORT_SERR
325 int64_t score1, score2, score3;
332 #ifdef CINEPAK_REPORT_SERR
339 ret += s->
lambda * 8 * mb_count;
342 for(x = 0; x < mb_count; x++) {
345 #ifdef CINEPAK_REPORT_SERR
358 *training_set_v1_shrunk = *training_set_v4_shrunk = 0;
359 for(x = 0; x < mb_count; x++) {
367 #ifdef CINEPAK_REPORT_SERR
372 for(x = 0; x < mb_count; x++) {
377 if(score1 <= score2) {
379 #ifdef CINEPAK_REPORT_SERR
385 #ifdef CINEPAK_REPORT_SERR
397 int v1_shrunk = 0, v4_shrunk = 0;
398 for(x = 0; x < mb_count; x++) {
405 #ifdef CINEPAK_REPORT_SERR
413 #ifdef CINEPAK_REPORT_SERR
418 #ifdef CINEPAK_REPORT_SERR
427 #ifdef CINEPAK_REPORT_SERR
432 #ifdef CINEPAK_REPORT_SERR
438 *training_set_v1_shrunk = v1_shrunk;
439 *training_set_v4_shrunk = v4_shrunk;
441 for(x = 0; x < mb_count; x++) {
447 if(score1 <= score2 && score1 <= score3) {
449 #ifdef CINEPAK_REPORT_SERR
453 }
else if(score2 <= score3) {
455 #ifdef CINEPAK_REPORT_SERR
461 #ifdef CINEPAK_REPORT_SERR
485 int incremental_codebook_replacement_mode = 0;
490 chunk_type_yuv+(incremental_codebook_replacement_mode?1:0) :
491 chunk_type_gray+(incremental_codebook_replacement_mode?1:0),
493 + (incremental_codebook_replacement_mode?(size+31)/32*4:0) );
500 if(incremental_codebook_replacement_mode) {
503 for(x = 0; x <
size; x++) {
509 flags = ((flags>>1) | 0x80000000);
510 for(y = 0; y < entry_size; y++)
511 buf[ret++] = codebook[y + x*entry_size] ^ (y >= 4 ? 0x80 : 0);
512 if((flags&0xffffffff) == 0xffffffff) {
513 AV_WB32(&buf[flagsind], flags);
518 AV_WB32(&buf[flagsind], flags);
520 for(x = 0; x <
size; x++)
521 for(y = 0; y < entry_size; y++)
522 buf[ret++] = codebook[y + x*entry_size] ^ (y >= 4 ? 0x80 : 0);
529 uint8_t * in_data[4],
int in_linesize[4],
530 uint8_t *out_data[4],
int out_linesize[4])
532 out_data[0] = in_data[0] + x + y * in_linesize[0];
533 out_linesize[0] = in_linesize[0];
536 out_data[1] = in_data[1] + (x >> 1) + (y >> 1) * in_linesize[1];
537 out_linesize[1] = in_linesize[1];
539 out_data[2] = in_data[2] + (x >> 1) + (y >> 1) * in_linesize[2];
540 out_linesize[2] = in_linesize[2];
546 int linesize[4],
int v1_vector,
strip_info *info)
552 data[0][ linesize[0]] =
553 data[0][1+ linesize[0]] = info->
v1_codebook[v1_vector*entry_size];
557 data[0][2+ linesize[0]] =
558 data[0][3+ linesize[0]] = info->
v1_codebook[v1_vector*entry_size+1];
560 data[0][2*linesize[0]] =
561 data[0][1+2*linesize[0]] =
562 data[0][ 3*linesize[0]] =
563 data[0][1+3*linesize[0]] = info->
v1_codebook[v1_vector*entry_size+2];
565 data[0][2+2*linesize[0]] =
566 data[0][3+2*linesize[0]] =
567 data[0][2+3*linesize[0]] =
568 data[0][3+3*linesize[0]] = info->
v1_codebook[v1_vector*entry_size+3];
573 data[1][ linesize[1]] =
574 data[1][1+ linesize[1]] = info->
v1_codebook[v1_vector*entry_size+4];
578 data[2][ linesize[2]] =
579 data[2][1+ linesize[2]] = info->
v1_codebook[v1_vector*entry_size+5];
585 int linesize[4],
int *v4_vector,
strip_info *info)
589 for(i = y = 0; y < 4; y += 2) {
590 for(x = 0; x < 4; x += 2, i++) {
591 data[0][x + y*linesize[0]] = info->
v4_codebook[v4_vector[i]*entry_size];
592 data[0][x+1 + y*linesize[0]] = info->
v4_codebook[v4_vector[i]*entry_size+1];
593 data[0][x + (y+1)*linesize[0]] = info->
v4_codebook[v4_vector[i]*entry_size+2];
594 data[0][x+1 + (y+1)*linesize[0]] = info->
v4_codebook[v4_vector[i]*entry_size+3];
597 data[1][(x>>1) + (y>>1)*linesize[1]] = info->
v4_codebook[v4_vector[i]*entry_size+4];
598 data[2][(x>>1) + (y>>1)*linesize[2]] = info->
v4_codebook[v4_vector[i]*entry_size+5];
605 uint8_t *a_data[4],
int a_linesize[4],
606 uint8_t *b_data[4],
int b_linesize[4])
611 memcpy(a_data[0]+y*a_linesize[0], b_data[0]+y*b_linesize[0],
616 for(p = 1; p <= 2; p++) {
617 for(y = 0; y < MB_SIZE/2; y++) {
618 memcpy(a_data[p] + y*a_linesize[p],
619 b_data[p] + y*b_linesize[p],
627 uint8_t *scratch_data[4],
int scratch_linesize[4],
628 uint8_t *last_data[4],
int last_linesize[4],
631 int x, y, z,
flags,
bits, temp_size, header_ofs, ret = 0, mb_count = s->
w * h /
MB_AREA;
632 int needs_extra_bit, should_write_temp;
633 unsigned char temp[64];
635 uint8_t *sub_scratch_data[4] = {0}, *sub_last_data[4] = {0};
636 int sub_scratch_linesize[4] = {0}, sub_last_linesize[4] = {0};
649 for(z = y = 0; y <
h; y +=
MB_SIZE) {
650 for(x = 0; x < s->
w; x +=
MB_SIZE, z++) {
654 sub_scratch_data, sub_scratch_linesize);
658 last_data, last_linesize,
659 sub_last_data, sub_last_linesize);
660 copy_mb(s, sub_scratch_data, sub_scratch_linesize,
661 sub_last_data, sub_last_linesize);
676 for(x = 0; x < mb_count; x++)
685 for(x = 0; x < mb_count; x += 32) {
687 for(y = x; y <
FFMIN(x+32, mb_count); y++)
689 flags |= 1 << (31 - y + x);
694 for(y = x; y <
FFMIN(x+32, mb_count); y++) {
700 for(z = 0; z < 4; z++)
712 flags = bits = temp_size = 0;
714 for(x = 0; x < mb_count; x++) {
718 should_write_temp = 0;
733 memcpy(&buf[ret], temp, temp_size);
737 should_write_temp = 1;
740 if(needs_extra_bit) {
748 for(z = 0; z < 4; z++)
751 if(should_write_temp) {
752 memcpy(&buf[ret], temp, temp_size);
761 memcpy(&buf[ret], temp, temp_size);
775 uint8_t *a_data[4],
int a_linesize[4],
776 uint8_t *b_data[4],
int b_linesize[4])
778 int x, y, p, d, ret = 0;
782 d = a_data[0][x + y*a_linesize[0]] - b_data[0][x + y*b_linesize[0]];
788 for(p = 1; p <= 2; p++) {
789 for(y = 0; y < MB_SIZE/2; y++) {
790 for(x = 0; x < MB_SIZE/2; x++) {
791 d = a_data[p][x + y*a_linesize[p]] - b_data[p][x + y*b_linesize[p]];
802 #define CERTAIN(x) ((x)!=ENC_UNCERTAIN)
808 int x, y, i, j, k, x2, y2, x3, y3,
plane,
shift, mbn;
812 int64_t total_error = 0;
814 uint8_t *sub_data [4], *vq_data [4];
815 int sub_linesize[4], vq_linesize[4];
817 for(mbn = i = y = 0; y <
h; y +=
MB_SIZE) {
818 for(x = 0; x < s->
w; x +=
MB_SIZE, ++mbn) {
829 for(j = y2 = 0; y2 < entry_size; y2 += 2) {
830 for(x2 = 0; x2 < 4; x2 += 2, j++) {
831 plane = y2 < 4 ? 0 : 1 + (x2 >> 1);
832 shift = y2 < 4 ? 0 : 1;
835 base[j] = (data[
plane][((x+x3) >> shift) + ((y+y3) >> shift) * linesize[
plane]] +
836 data[
plane][((x+x3) >> shift) + 1 + ((y+y3) >> shift) * linesize[
plane]] +
837 data[
plane][((x+x3) >> shift) + (((y+y3) >> shift) + 1) * linesize[plane]] +
838 data[plane][((x+x3) >>
shift) + 1 + (((y+y3) >>
shift) + 1) * linesize[
plane]]) >> 2;
843 for(j = y2 = 0; y2 <
MB_SIZE; y2 += 2) {
844 for(x2 = 0; x2 <
MB_SIZE; x2 += 2) {
845 for(k = 0; k < entry_size; k++, j++) {
846 plane = k >= 4 ? k - 3 : 0;
852 x3 = x + x2 + (k & 1);
853 y3 = y + y2 + (k >> 1);
856 base[j] = data[
plane][x3 + y3*linesize[
plane]];
879 vq_data[0] = vq_pict_buf;
881 vq_data[1] = &vq_pict_buf[
MB_AREA];
882 vq_data[2] = vq_data[1] + (
MB_AREA >> 2);
883 vq_linesize[1] = vq_linesize[2] =
MB_SIZE >> 1;
886 for(i = j = y = 0; y <
h; y +=
MB_SIZE) {
887 for(x = 0; x < s->
w; x +=
MB_SIZE, j++) {
903 vq_data, vq_linesize);
906 for(k = 0; k < 4; k++)
913 vq_data, vq_linesize);
928 uint8_t *last_data[4],
int last_linesize[4],
933 uint8_t *sub_last_data [4], *sub_pict_data [4];
934 int sub_last_linesize[4], sub_pict_linesize[4];
936 for(i = y = 0; y <
h; y +=
MB_SIZE) {
937 for(x = 0; x < s->
w; x +=
MB_SIZE, i++) {
939 sub_last_data, sub_last_linesize);
941 sub_pict_data, sub_pict_linesize);
944 sub_last_data, sub_last_linesize,
945 sub_pict_data, sub_pict_linesize);
957 buf[0] = keyframe ? 0x10: 0x11;
969 uint8_t *last_data[4],
int last_linesize[4],
971 uint8_t *scratch_data[4],
int scratch_linesize[4],
972 unsigned char *
buf, int64_t *best_score
973 #ifdef CINEPAK_REPORT_SERR
979 #ifdef CINEPAK_REPORT_SERR
985 int v1enough, v1_size, v4enough, v4_size;
986 int new_v1_size, new_v4_size;
987 int v1shrunk, v4shrunk;
997 #define SMALLEST_CODEBOOK 1
999 for(v4enough = 0, v4_size = 0; v4_size <= v1_size && !v4enough; v4_size = v4_size ? v4_size << 2 : v1_size >= SMALLEST_CODEBOOK << 2 ? v1_size >> 2 :
SMALLEST_CODEBOOK) {
1034 &v1shrunk, &v4shrunk
1035 #ifdef CINEPAK_REPORT_SERR
1046 if(new_v1_size < info.
v1_size){
1053 if(new_v4_size < info.
v4_size) {
1063 &v1shrunk, &v4shrunk
1064 #ifdef CINEPAK_REPORT_SERR
1069 if((!v1shrunk && !v4shrunk) || !extra_iterations_limit--)
break;
1074 if(new_v1_size < info.
v1_size){
1082 if(new_v4_size < info.
v4_size) {
1092 if(best_size == 0 || score < *best_score) {
1094 *best_score = score;
1095 #ifdef CINEPAK_REPORT_SERR
1099 scratch_data, scratch_linesize,
1100 last_data, last_linesize, &info,
1105 #ifdef CINEPAK_REPORT_SERR
1109 #ifdef CINEPAKENC_DEBUG
1111 memcpy(s->best_mb, s->
mb, mb_count*
sizeof(
mb_info));
1122 #ifdef CINEPAKENC_DEBUG
1134 for(x = 0; x < s->
w*h/
MB_AREA; x++)
1135 if(s->best_mb[x].best_encoding ==
ENC_V1)
1137 else if(s->best_mb[x].best_encoding ==
ENC_V4)
1152 buf[0] = isakeyframe ? 0 : 1;
1162 int isakeyframe,
unsigned char *
buf,
int buf_size)
1164 int num_strips, strip, i, y, nexty,
size, temp_size;
1165 uint8_t *last_data [4], *
data [4], *scratch_data [4];
1166 int last_linesize[4], linesize[4], scratch_linesize[4];
1167 int64_t best_score = 0, score, score_temp;
1168 #ifdef CINEPAK_REPORT_SERR
1169 int64_t best_serr = 0, serr, serr_temp;
1172 int best_nstrips = -1, best_size = -1;
1177 for(y = 0; y < s->
h; y += 2) {
1178 for(x = 0; x < s->
w; x += 2) {
1181 ir[1] = ir[0] + frame->
linesize[0];
1184 scratch_data, scratch_linesize);
1186 for(i=0; i<4; ++i) {
1188 i1 = (i&1); i2 = (i>=2);
1189 rr = ir[i2][i1*3+0];
1190 gg = ir[i2][i1*3+1];
1191 bb = ir[i2][i1*3+2];
1192 r += rr; g += gg; b += bb;
1196 rr = (2396625*rr + 4793251*gg + 1198732*bb) >> 23;
1198 else if (rr > 255) rr = 255;
1199 scratch_data[0][i1 + i2*scratch_linesize[0]] = rr;
1205 rr = (-299683*r - 599156*g + 898839*
b) >> 23;
1206 if( rr < -128) rr = -128;
1207 else if (rr > 127) rr = 127;
1208 scratch_data[1][0] = rr + 128;
1211 rr = (748893*r - 599156*g - 149737*
b) >> 23;
1212 if( rr < -128) rr = -128;
1213 else if (rr > 127) rr = 127;
1214 scratch_data[2][0] = rr + 128;
1221 for(num_strips = s->
min_strips; num_strips <= s->max_strips && num_strips <= s->
h /
MB_SIZE; num_strips++) {
1224 #ifdef CINEPAK_REPORT_SERR
1228 for(y = 0, strip = 1; y < s->
h; strip++, y = nexty) {
1231 nexty = strip * s->
h / num_strips;
1234 nexty += 4 - (nexty & 3);
1236 strip_height = nexty - y;
1237 if(strip_height <= 0) {
1252 last_data, last_linesize);
1255 scratch_data, scratch_linesize);
1257 if((temp_size =
rd_strip(s, y, strip_height, isakeyframe,
1258 last_data, last_linesize, data, linesize,
1259 scratch_data, scratch_linesize,
1261 #ifdef CINEPAK_REPORT_SERR
1267 score += score_temp;
1268 #ifdef CINEPAK_REPORT_SERR
1276 if(best_score == 0 || score < best_score) {
1278 #ifdef CINEPAK_REPORT_SERR
1283 #ifdef CINEPAK_REPORT_SERR
1284 av_log(s->
avctx,
AV_LOG_INFO,
"best number of strips so far: %2i, %12"PRId64
", %i B\n", num_strips, serr, best_size);
1289 best_nstrips = num_strips;
1293 if(num_strips - best_nstrips > 4)
1297 av_assert0(best_nstrips >= 0 && best_size >= 0);
1364 #ifdef CINEPAKENC_DEBUG
1371 #ifdef CINEPAKENC_DEBUG
1372 av_log(avctx,
AV_LOG_INFO,
"strip coding stats: %i V1 mode, %i V4 mode, %i MC mode (%i V1 encs, %i V4 encs, %i skips)\n",
1373 s->num_v1_mode, s->num_v4_mode, s->num_mc_mode, s->num_v1_encs, s->num_v4_encs, s->num_skips);
static enum AVPixelFormat pix_fmt
static int shift(int a, int b)
This structure describes decoded (raw) audio or video data.
ptrdiff_t const GLvoid * data
static void calculate_skip_errors(CinepakEncContext *s, int h, uint8_t *last_data[4], int last_linesize[4], uint8_t *data[4], int linesize[4], strip_info *info)
#define LIBAVUTIL_VERSION_INT
packed RGB 8:8:8, 24bpp, RGBRGB...
static av_cold int init(AVCodecContext *avctx)
static int cinepak_encode_frame(AVCodecContext *avctx, AVPacket *pkt, const AVFrame *frame, int *got_packet)
static void write_strip_header(CinepakEncContext *s, int y, int h, int keyframe, unsigned char *buf, int strip_size)
int strip_number_delta_range
enum AVPixelFormat pix_fmt
Pixel format, see AV_PIX_FMT_xxx.
static void get_sub_picture(CinepakEncContext *s, int x, int y, uint8_t *in_data[4], int in_linesize[4], uint8_t *out_data[4], int out_linesize[4])
int v1_codebook[CODEBOOK_MAX *VECTOR_MAX]
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
#define av_assert0(cond)
assert() equivalent, that is always enabled.
static int compute_mb_distortion(CinepakEncContext *s, uint8_t *a_data[4], int a_linesize[4], uint8_t *b_data[4], int b_linesize[4])
AVFrame * av_frame_alloc(void)
Allocate an AVFrame and set its fields to default values.
#define CHUNK_HEADER_SIZE
static int rd_strip(CinepakEncContext *s, int y, int h, int keyframe, uint8_t *last_data[4], int last_linesize[4], uint8_t *data[4], int linesize[4], uint8_t *scratch_data[4], int scratch_linesize[4], unsigned char *buf, int64_t *best_score)
int avpriv_do_elbg(int *points, int dim, int numpoints, int *codebook, int numCB, int max_steps, int *closest_cb, AVLFG *rand_state)
Implementation of the Enhanced LBG Algorithm Based on the paper "Neural Networks 14:1219-1237" that c...
#define SMALLEST_CODEBOOK
int v4_codebook[CODEBOOK_MAX *VECTOR_MAX]
static const AVOption options[]
#define AV_PKT_FLAG_KEY
The packet contains a keyframe.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
unsigned char * frame_buf
static void copy_mb(CinepakEncContext *s, uint8_t *a_data[4], int a_linesize[4], uint8_t *b_data[4], int b_linesize[4])
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
simple assert() macros that are a bit more flexible than ISO C assert().
const char * name
Name of the codec implementation.
static void decode_v1_vector(CinepakEncContext *s, uint8_t *data[4], int linesize[4], int v1_vector, strip_info *info)
int flags
A combination of AV_PKT_FLAG values.
static av_cold int cinepak_encode_init(AVCodecContext *avctx)
int width
picture width / height.
static int write_chunk_header(unsigned char *buf, int chunk_type, int chunk_size)
static void decode_v4_vector(CinepakEncContext *s, uint8_t *data[4], int linesize[4], int *v4_vector, strip_info *info)
int quality
quality (between 1 (good) and FF_LAMBDA_MAX (bad))
#define AV_LOG_INFO
Standard information.
mb_encoding best_encoding
int avpriv_init_elbg(int *points, int dim, int numpoints, int *codebook, int numCB, int max_steps, int *closest_cb, AVLFG *rand_state)
Initialize the **codebook vector for the elbg algorithm.
Libavcodec external API header.
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
main external API structure.
AVCodec ff_cinepak_encoder
Describe the class of an AVClass context structure.
#define STRIP_HEADER_SIZE
av_cold void av_lfg_init(AVLFG *c, unsigned int seed)
static int encode_codebook(CinepakEncContext *s, int *codebook, int size, int chunk_type_yuv, int chunk_type_gray, unsigned char *buf)
int ff_alloc_packet2(AVCodecContext *avctx, AVPacket *avpkt, int64_t size, int64_t min_size)
Check AVPacket size and/or allocate data.
static int encode_mode(CinepakEncContext *s, int h, uint8_t *scratch_data[4], int scratch_linesize[4], uint8_t *last_data[4], int last_linesize[4], strip_info *info, unsigned char *buf)
static const AVClass cinepak_class
static enum AVPixelFormat pix_fmts[]
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
int max_extra_cb_iterations
common internal api header.
static int quantize(CinepakEncContext *s, int h, uint8_t *data[4], int linesize[4], int v1mode, strip_info *info, mb_encoding encoding)
unsigned char * strip_buf
unsigned char * pict_bufs[4]
static int rd_frame(CinepakEncContext *s, const AVFrame *frame, int isakeyframe, unsigned char *buf, int buf_size)
static int64_t calculate_mode_score(CinepakEncContext *s, int h, strip_info *info, int report, int *training_set_v1_shrunk, int *training_set_v4_shrunk)
#define av_malloc_array(a, b)
#define FFSWAP(type, a, b)
AVPixelFormat
Pixel format.
This structure stores compressed data.
enum AVPixelFormat pix_fmt
static av_cold int cinepak_encode_end(AVCodecContext *avctx)
static int write_cvid_header(CinepakEncContext *s, unsigned char *buf, int num_strips, int data_size, int isakeyframe)
int keyint_min
minimum GOP size