1/*
2 * MPEG-4 / H.263 HW decode acceleration through VA API
3 *
4 * Copyright (C) 2008-2009 Splitted-Desktop Systems
5 *
6 * This file is part of Libav.
7 *
8 * Libav is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
12 *
13 * Libav is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
16 * Lesser General Public License for more details.
17 *
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with Libav; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21 */
22
23#include "vaapi_internal.h"
24#include "h263.h"
25
26/** Reconstruct bitstream intra_dc_vlc_thr */
27static int mpeg4_get_intra_dc_vlc_thr(MpegEncContext *s)
28{
29    switch (s->intra_dc_threshold) {
30    case 99: return 0;
31    case 13: return 1;
32    case 15: return 2;
33    case 17: return 3;
34    case 19: return 4;
35    case 21: return 5;
36    case 23: return 6;
37    case 0:  return 7;
38    }
39    return 0;
40}
41
42static int vaapi_mpeg4_start_frame(AVCodecContext *avctx, av_unused const uint8_t *buffer, av_unused uint32_t size)
43{
44    MpegEncContext * const s = avctx->priv_data;
45    struct vaapi_context * const vactx = avctx->hwaccel_context;
46    VAPictureParameterBufferMPEG4 *pic_param;
47    VAIQMatrixBufferMPEG4 *iq_matrix;
48    int i;
49
50    av_dlog(avctx, "vaapi_mpeg4_start_frame()\n");
51
52    vactx->slice_param_size = sizeof(VASliceParameterBufferMPEG4);
53
54    /* Fill in VAPictureParameterBufferMPEG4 */
55    pic_param = ff_vaapi_alloc_pic_param(vactx, sizeof(VAPictureParameterBufferMPEG4));
56    if (!pic_param)
57        return -1;
58    pic_param->vop_width                                = s->width;
59    pic_param->vop_height                               = s->height;
60    pic_param->forward_reference_picture                = VA_INVALID_ID;
61    pic_param->backward_reference_picture               = VA_INVALID_ID;
62    pic_param->vol_fields.value                         = 0; /* reset all bits */
63    pic_param->vol_fields.bits.short_video_header       = avctx->codec->id == CODEC_ID_H263;
64    pic_param->vol_fields.bits.chroma_format            = CHROMA_420;
65    pic_param->vol_fields.bits.interlaced               = !s->progressive_sequence;
66    pic_param->vol_fields.bits.obmc_disable             = 1;
67    pic_param->vol_fields.bits.sprite_enable            = s->vol_sprite_usage;
68    pic_param->vol_fields.bits.sprite_warping_accuracy  = s->sprite_warping_accuracy;
69    pic_param->vol_fields.bits.quant_type               = s->mpeg_quant;
70    pic_param->vol_fields.bits.quarter_sample           = s->quarter_sample;
71    pic_param->vol_fields.bits.data_partitioned         = s->data_partitioning;
72    pic_param->vol_fields.bits.reversible_vlc           = s->rvlc;
73    pic_param->vol_fields.bits.resync_marker_disable    = !s->resync_marker;
74    pic_param->no_of_sprite_warping_points              = s->num_sprite_warping_points;
75    for (i = 0; i < s->num_sprite_warping_points && i < 3; i++) {
76        pic_param->sprite_trajectory_du[i]              = s->sprite_traj[i][0];
77        pic_param->sprite_trajectory_dv[i]              = s->sprite_traj[i][1];
78    }
79    pic_param->quant_precision                          = s->quant_precision;
80    pic_param->vop_fields.value                         = 0; /* reset all bits */
81    pic_param->vop_fields.bits.vop_coding_type          = s->pict_type - AV_PICTURE_TYPE_I;
82    pic_param->vop_fields.bits.backward_reference_vop_coding_type = s->pict_type == AV_PICTURE_TYPE_B ? s->next_picture.f.pict_type - AV_PICTURE_TYPE_I : 0;
83    pic_param->vop_fields.bits.vop_rounding_type        = s->no_rounding;
84    pic_param->vop_fields.bits.intra_dc_vlc_thr         = mpeg4_get_intra_dc_vlc_thr(s);
85    pic_param->vop_fields.bits.top_field_first          = s->top_field_first;
86    pic_param->vop_fields.bits.alternate_vertical_scan_flag = s->alternate_scan;
87    pic_param->vop_fcode_forward                        = s->f_code;
88    pic_param->vop_fcode_backward                       = s->b_code;
89    pic_param->vop_time_increment_resolution            = avctx->time_base.den;
90    pic_param->num_macroblocks_in_gob                   = s->mb_width * ff_h263_get_gob_height(s);
91    pic_param->num_gobs_in_vop                          = (s->mb_width * s->mb_height) / pic_param->num_macroblocks_in_gob;
92    pic_param->TRB                                      = s->pb_time;
93    pic_param->TRD                                      = s->pp_time;
94
95    if (s->pict_type == AV_PICTURE_TYPE_B)
96        pic_param->backward_reference_picture = ff_vaapi_get_surface_id(&s->next_picture);
97    if (s->pict_type != AV_PICTURE_TYPE_I)
98        pic_param->forward_reference_picture  = ff_vaapi_get_surface_id(&s->last_picture);
99
100    /* Fill in VAIQMatrixBufferMPEG4 */
101    /* Only the first inverse quantisation method uses the weighting matrices */
102    if (pic_param->vol_fields.bits.quant_type) {
103        iq_matrix = ff_vaapi_alloc_iq_matrix(vactx, sizeof(VAIQMatrixBufferMPEG4));
104        if (!iq_matrix)
105            return -1;
106        iq_matrix->load_intra_quant_mat         = 1;
107        iq_matrix->load_non_intra_quant_mat     = 1;
108
109        for (i = 0; i < 64; i++) {
110            int n = s->dsp.idct_permutation[ff_zigzag_direct[i]];
111            iq_matrix->intra_quant_mat[i]       = s->intra_matrix[n];
112            iq_matrix->non_intra_quant_mat[i]   = s->inter_matrix[n];
113        }
114    }
115    return 0;
116}
117
118static int vaapi_mpeg4_end_frame(AVCodecContext *avctx)
119{
120    return ff_vaapi_common_end_frame(avctx->priv_data);
121}
122
123static int vaapi_mpeg4_decode_slice(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size)
124{
125    MpegEncContext * const s = avctx->priv_data;
126    VASliceParameterBufferMPEG4 *slice_param;
127
128    av_dlog(avctx, "vaapi_mpeg4_decode_slice(): buffer %p, size %d\n", buffer, size);
129
130    /* video_plane_with_short_video_header() contains all GOBs
131     * in-order, and this is what VA API (Intel backend) expects: only
132     * a single slice param. So fake macroblock_number for Libav so
133     * that we don't call vaapi_mpeg4_decode_slice() again
134     */
135    if (avctx->codec->id == CODEC_ID_H263)
136        size = s->gb.buffer_end - buffer;
137
138    /* Fill in VASliceParameterBufferMPEG4 */
139    slice_param = (VASliceParameterBufferMPEG4 *)ff_vaapi_alloc_slice(avctx->hwaccel_context, buffer, size);
140    if (!slice_param)
141        return -1;
142    slice_param->macroblock_offset      = get_bits_count(&s->gb) % 8;
143    slice_param->macroblock_number      = s->mb_y * s->mb_width + s->mb_x;
144    slice_param->quant_scale            = s->qscale;
145
146    if (avctx->codec->id == CODEC_ID_H263)
147        s->mb_y = s->mb_height;
148
149    return 0;
150}
151
#if CONFIG_MPEG4_VAAPI_HWACCEL
/**
 * Hardware acceleration descriptor binding CODEC_ID_MPEG4 with the
 * PIX_FMT_VAAPI_VLD pixel format to the callbacks defined in this file.
 */
AVHWAccel ff_mpeg4_vaapi_hwaccel = {
    .name         = "mpeg4_vaapi",
    .id           = CODEC_ID_MPEG4,
    .type         = AVMEDIA_TYPE_VIDEO,
    .pix_fmt      = PIX_FMT_VAAPI_VLD,
    /* Per-picture callbacks */
    .start_frame  = vaapi_mpeg4_start_frame,
    .decode_slice = vaapi_mpeg4_decode_slice,
    .end_frame    = vaapi_mpeg4_end_frame,
};
#endif
163
#if CONFIG_H263_VAAPI_HWACCEL
/**
 * Hardware acceleration descriptor binding CODEC_ID_H263 with the
 * PIX_FMT_VAAPI_VLD pixel format to the callbacks defined in this file;
 * the same callbacks serve both MPEG-4 and H.263.
 */
AVHWAccel ff_h263_vaapi_hwaccel = {
    .name         = "h263_vaapi",
    .id           = CODEC_ID_H263,
    .type         = AVMEDIA_TYPE_VIDEO,
    .pix_fmt      = PIX_FMT_VAAPI_VLD,
    /* Per-picture callbacks */
    .start_frame  = vaapi_mpeg4_start_frame,
    .decode_slice = vaapi_mpeg4_decode_slice,
    .end_frame    = vaapi_mpeg4_end_frame,
};
#endif
175