| /* |
| * Copyright (c) 2010 The WebM project authors. All Rights Reserved. |
| * |
| * Use of this source code is governed by a BSD-style license |
| * that can be found in the LICENSE file in the root of the source |
| * tree. An additional intellectual property rights grant can be found |
| * in the file PATENTS. All contributing project authors may |
| * be found in the AUTHORS file in the root of the source tree. |
| */ |
| |
| |
| #include "onyxc_int.h" |
| #include "onyx_int.h" |
| #include "quantize.h" |
| #include "vpx_mem/vpx_mem.h" |
| #include "vpx_scale/yv12extend.h" |
| #include "vpx_scale/vpxscale.h" |
| #include "alloccommon.h" |
| #if ARCH_ARM |
| #include "vpx_ports/arm.h" |
| #endif |
| |
| extern void vp8_loop_filter_frame(VP8_COMMON *cm, MACROBLOCKD *mbd, int filt_val); |
| extern void vp8_loop_filter_frame_yonly(VP8_COMMON *cm, MACROBLOCKD *mbd, int filt_val, int sharpness_lvl); |
| extern int vp8_calc_ss_err(YV12_BUFFER_CONFIG *source, YV12_BUFFER_CONFIG *dest, const vp8_variance_rtcd_vtable_t *rtcd); |
| #if HAVE_ARMV7 |
| extern void vp8_yv12_copy_frame_yonly_no_extend_frame_borders_neon(YV12_BUFFER_CONFIG *src_ybc, YV12_BUFFER_CONFIG *dst_ybc); |
| #endif |
| |
| #if CONFIG_RUNTIME_CPU_DETECT |
| #define IF_RTCD(x) (x) |
| #else |
| #define IF_RTCD(x) NULL |
| #endif |
| |
| extern void |
| (*vp8_yv12_copy_partial_frame_ptr)(YV12_BUFFER_CONFIG *src_ybc, |
| YV12_BUFFER_CONFIG *dst_ybc, |
| int Fraction); |
| void |
| vp8_yv12_copy_partial_frame(YV12_BUFFER_CONFIG *src_ybc, YV12_BUFFER_CONFIG *dst_ybc, int Fraction) |
| { |
| unsigned char *src_y, *dst_y; |
| int yheight; |
| int ystride; |
| int border; |
| int yoffset; |
| int linestocopy; |
| |
| border = src_ybc->border; |
| yheight = src_ybc->y_height; |
| ystride = src_ybc->y_stride; |
| |
| linestocopy = (yheight >> (Fraction + 4)); |
| |
| if (linestocopy < 1) |
| linestocopy = 1; |
| |
| linestocopy <<= 4; |
| |
| yoffset = ystride * ((yheight >> 5) * 16 - 8); |
| src_y = src_ybc->y_buffer + yoffset; |
| dst_y = dst_ybc->y_buffer + yoffset; |
| |
| vpx_memcpy(dst_y, src_y, ystride *(linestocopy + 16)); |
| } |
| |
| static int vp8_calc_partial_ssl_err(YV12_BUFFER_CONFIG *source, YV12_BUFFER_CONFIG *dest, int Fraction, const vp8_variance_rtcd_vtable_t *rtcd) |
| { |
| int i, j; |
| int Total = 0; |
| int srcoffset, dstoffset; |
| unsigned char *src = source->y_buffer; |
| unsigned char *dst = dest->y_buffer; |
| |
| int linestocopy = (source->y_height >> (Fraction + 4)); |
| (void)rtcd; |
| |
| if (linestocopy < 1) |
| linestocopy = 1; |
| |
| linestocopy <<= 4; |
| |
| |
| srcoffset = source->y_stride * (dest->y_height >> 5) * 16; |
| dstoffset = dest->y_stride * (dest->y_height >> 5) * 16; |
| |
| src += srcoffset; |
| dst += dstoffset; |
| |
| // Loop through the Y plane raw and reconstruction data summing (square differences) |
| for (i = 0; i < linestocopy; i += 16) |
| { |
| for (j = 0; j < source->y_width; j += 16) |
| { |
| unsigned int sse; |
| Total += VARIANCE_INVOKE(rtcd, mse16x16)(src + j, source->y_stride, dst + j, dest->y_stride, &sse); |
| } |
| |
| src += 16 * source->y_stride; |
| dst += 16 * dest->y_stride; |
| } |
| |
| return Total; |
| } |
| |
| extern void vp8_loop_filter_partial_frame |
| ( |
| VP8_COMMON *cm, |
| MACROBLOCKD *mbd, |
| int default_filt_lvl, |
| int sharpness_lvl, |
| int Fraction |
| ); |
| |
| // Enforce a minimum filter level based upon baseline Q |
| static int get_min_filter_level(VP8_COMP *cpi, int base_qindex) |
| { |
| int min_filter_level; |
| |
| if (cpi->source_alt_ref_active && cpi->common.refresh_golden_frame && !cpi->common.refresh_alt_ref_frame) |
| min_filter_level = 0; |
| else |
| { |
| if (base_qindex <= 6) |
| min_filter_level = 0; |
| else if (base_qindex <= 16) |
| min_filter_level = 1; |
| else |
| min_filter_level = (base_qindex / 8); |
| } |
| |
| return min_filter_level; |
| } |
| |
| // Enforce a maximum filter level based upon baseline Q |
| static int get_max_filter_level(VP8_COMP *cpi, int base_qindex) |
| { |
| // PGW August 2006: Highest filter values almost always a bad idea |
| |
| // jbb chg: 20100118 - not so any more with this overquant stuff allow high values |
| // with lots of intra coming in. |
| int max_filter_level = MAX_LOOP_FILTER ;//* 3 / 4; |
| |
| if (cpi->section_intra_rating > 8) |
| max_filter_level = MAX_LOOP_FILTER * 3 / 4; |
| |
| (void) cpi; |
| (void) base_qindex; |
| |
| return max_filter_level; |
| } |
| |
| void vp8cx_pick_filter_level_fast(YV12_BUFFER_CONFIG *sd, VP8_COMP *cpi) |
| { |
| VP8_COMMON *cm = &cpi->common; |
| |
| int best_err = 0; |
| int filt_err = 0; |
| int min_filter_level = 0; |
| int max_filter_level = MAX_LOOP_FILTER * 3 / 4; // PGW August 2006: Highest filter values almost always a bad idea |
| int filt_val; |
| int best_filt_val = cm->filter_level; |
| |
| // Make a copy of the unfiltered / processed recon buffer |
| //vp8_yv12_copy_frame_ptr( cm->frame_to_show, &cpi->last_frame_uf ); |
| vp8_yv12_copy_partial_frame_ptr(cm->frame_to_show, &cpi->last_frame_uf, 3); |
| |
| if (cm->frame_type == KEY_FRAME) |
| cm->sharpness_level = 0; |
| else |
| cm->sharpness_level = cpi->oxcf.Sharpness; |
| |
| // Enforce a minimum filter level based upon Q |
| min_filter_level = get_min_filter_level(cpi, cm->base_qindex); |
| max_filter_level = get_max_filter_level(cpi, cm->base_qindex); |
| |
| // Start the search at the previous frame filter level unless it is now out of range. |
| if (cm->filter_level < min_filter_level) |
| cm->filter_level = min_filter_level; |
| else if (cm->filter_level > max_filter_level) |
| cm->filter_level = max_filter_level; |
| |
| filt_val = cm->filter_level; |
| best_filt_val = filt_val; |
| |
| // Set up alternate filter values |
| |
| // Get the err using the previous frame's filter value. |
| vp8_loop_filter_partial_frame(cm, &cpi->mb.e_mbd, filt_val, 0 , 3); |
| cm->last_frame_type = cm->frame_type; |
| cm->last_filter_type = cm->filter_type; |
| cm->last_sharpness_level = cm->sharpness_level; |
| |
| best_err = vp8_calc_partial_ssl_err(sd, cm->frame_to_show, 3, IF_RTCD(&cpi->rtcd.variance)); |
| |
| // Re-instate the unfiltered frame |
| vp8_yv12_copy_partial_frame_ptr(&cpi->last_frame_uf, cm->frame_to_show, 3); |
| |
| filt_val -= (1 + ((filt_val > 10) ? 1 : 0)); |
| |
| // Search lower filter levels |
| while (filt_val >= min_filter_level) |
| { |
| // Apply the loop filter |
| vp8_loop_filter_partial_frame(cm, &cpi->mb.e_mbd, filt_val, 0, 3); |
| cm->last_frame_type = cm->frame_type; |
| cm->last_filter_type = cm->filter_type; |
| cm->last_sharpness_level = cm->sharpness_level; |
| |
| // Get the err for filtered frame |
| filt_err = vp8_calc_partial_ssl_err(sd, cm->frame_to_show, 3, IF_RTCD(&cpi->rtcd.variance)); |
| |
| |
| // Re-instate the unfiltered frame |
| vp8_yv12_copy_partial_frame_ptr(&cpi->last_frame_uf, cm->frame_to_show, 3); |
| |
| |
| // Update the best case record or exit loop. |
| if (filt_err < best_err) |
| { |
| best_err = filt_err; |
| best_filt_val = filt_val; |
| } |
| else |
| break; |
| |
| // Adjust filter level |
| filt_val -= (1 + ((filt_val > 10) ? 1 : 0)); |
| } |
| |
| // Search up (note that we have already done filt_val = cm->filter_level) |
| filt_val = cm->filter_level + (1 + ((filt_val > 10) ? 1 : 0)); |
| |
| if (best_filt_val == cm->filter_level) |
| { |
| // Resist raising filter level for very small gains |
| best_err -= (best_err >> 10); |
| |
| while (filt_val < max_filter_level) |
| { |
| // Apply the loop filter |
| vp8_loop_filter_partial_frame(cm, &cpi->mb.e_mbd, filt_val, 0, 3); |
| cm->last_frame_type = cm->frame_type; |
| cm->last_filter_type = cm->filter_type; |
| cm->last_sharpness_level = cm->sharpness_level; |
| |
| // Get the err for filtered frame |
| filt_err = vp8_calc_partial_ssl_err(sd, cm->frame_to_show, 3, IF_RTCD(&cpi->rtcd.variance)); |
| |
| // Re-instate the unfiltered frame |
| vp8_yv12_copy_partial_frame_ptr(&cpi->last_frame_uf, cm->frame_to_show, 3); |
| |
| // Update the best case record or exit loop. |
| if (filt_err < best_err) |
| { |
| // Do not raise filter level if improvement is < 1 part in 4096 |
| best_err = filt_err - (filt_err >> 10); |
| |
| best_filt_val = filt_val; |
| } |
| else |
| break; |
| |
| // Adjust filter level |
| filt_val += (1 + ((filt_val > 10) ? 1 : 0)); |
| } |
| } |
| |
| cm->filter_level = best_filt_val; |
| |
| if (cm->filter_level < min_filter_level) |
| cm->filter_level = min_filter_level; |
| |
| if (cm->filter_level > max_filter_level) |
| cm->filter_level = max_filter_level; |
| } |
| |
| // Stub function for now Alt LF not used |
| void vp8cx_set_alt_lf_level(VP8_COMP *cpi, int filt_val) |
| { |
| MACROBLOCKD *mbd = &cpi->mb.e_mbd; |
| (void) filt_val; |
| |
| mbd->segment_feature_data[MB_LVL_ALT_LF][0] = cpi->segment_feature_data[MB_LVL_ALT_LF][0]; |
| mbd->segment_feature_data[MB_LVL_ALT_LF][1] = cpi->segment_feature_data[MB_LVL_ALT_LF][1]; |
| mbd->segment_feature_data[MB_LVL_ALT_LF][2] = cpi->segment_feature_data[MB_LVL_ALT_LF][2]; |
| mbd->segment_feature_data[MB_LVL_ALT_LF][3] = cpi->segment_feature_data[MB_LVL_ALT_LF][3]; |
| } |
| |
| void vp8cx_pick_filter_level(YV12_BUFFER_CONFIG *sd, VP8_COMP *cpi) |
| { |
| VP8_COMMON *cm = &cpi->common; |
| |
| int best_err = 0; |
| int filt_err = 0; |
| int min_filter_level; |
| int max_filter_level; |
| int prediction_difference = (int)(100 * abs((int)(cpi->last_auto_filter_prediction_error - cpi->prediction_error)) / (1 + cpi->prediction_error)); |
| |
| int filter_step; |
| int filt_high = 0; |
| int filt_mid = cm->filter_level; // Start search at previous frame filter level |
| int filt_low = 0; |
| int filt_best; |
| int filt_direction = 0; |
| |
| int Bias = 0; // Bias against raising loop filter and in favour of lowering it |
| |
| // Make a copy of the unfiltered / processed recon buffer |
| #if HAVE_ARMV7 |
| #if CONFIG_RUNTIME_CPU_DETECT |
| if (cm->rtcd.flags & HAS_NEON) |
| #endif |
| { |
| vp8_yv12_copy_frame_yonly_no_extend_frame_borders_neon(cm->frame_to_show, &cpi->last_frame_uf); |
| } |
| #if CONFIG_RUNTIME_CPU_DETECT |
| else |
| #endif |
| #endif |
| #if !HAVE_ARMV7 || CONFIG_RUNTIME_CPU_DETECT |
| { |
| vp8_yv12_copy_frame_ptr(cm->frame_to_show, &cpi->last_frame_uf); |
| } |
| #endif |
| |
| if (cm->frame_type == KEY_FRAME) |
| cm->sharpness_level = 0; |
| else |
| cm->sharpness_level = cpi->oxcf.Sharpness; |
| |
| // Enforce a minimum filter level based upon Q |
| min_filter_level = get_min_filter_level(cpi, cm->base_qindex); |
| max_filter_level = get_max_filter_level(cpi, cm->base_qindex); |
| |
| // Start the search at the previous frame filter level unless it is now out of range. |
| filt_mid = cm->filter_level; |
| |
| if (filt_mid < min_filter_level) |
| filt_mid = min_filter_level; |
| else if (filt_mid > max_filter_level) |
| filt_mid = max_filter_level; |
| |
| // Define the initial step size |
| filter_step = (filt_mid < 16) ? 4 : filt_mid / 4; |
| |
| // Get baseline error score |
| vp8cx_set_alt_lf_level(cpi, filt_mid); |
| vp8_loop_filter_frame_yonly(cm, &cpi->mb.e_mbd, filt_mid, 0); |
| cm->last_frame_type = cm->frame_type; |
| cm->last_filter_type = cm->filter_type; |
| cm->last_sharpness_level = cm->sharpness_level; |
| |
| best_err = vp8_calc_ss_err(sd, cm->frame_to_show, IF_RTCD(&cpi->rtcd.variance)); |
| filt_best = filt_mid; |
| |
| // Re-instate the unfiltered frame |
| #if HAVE_ARMV7 |
| #if CONFIG_RUNTIME_CPU_DETECT |
| if (cm->rtcd.flags & HAS_NEON) |
| #endif |
| { |
| vp8_yv12_copy_frame_yonly_no_extend_frame_borders_neon(&cpi->last_frame_uf, cm->frame_to_show); |
| } |
| #if CONFIG_RUNTIME_CPU_DETECT |
| else |
| #endif |
| #endif |
| #if !HAVE_ARMV7 || CONFIG_RUNTIME_CPU_DETECT |
| { |
| vp8_yv12_copy_frame_yonly_ptr(&cpi->last_frame_uf, cm->frame_to_show); |
| } |
| #endif |
| |
| while (filter_step > 0) |
| { |
| Bias = (best_err >> (15 - (filt_mid / 8))) * filter_step; //PGW change 12/12/06 for small images |
| |
| // jbb chg: 20100118 - in sections with lots of new material coming in don't bias as much to a low filter value |
| if (cpi->section_intra_rating < 20) |
| Bias = Bias * cpi->section_intra_rating / 20; |
| |
| filt_high = ((filt_mid + filter_step) > max_filter_level) ? max_filter_level : (filt_mid + filter_step); |
| filt_low = ((filt_mid - filter_step) < min_filter_level) ? min_filter_level : (filt_mid - filter_step); |
| |
| if ((filt_direction <= 0) && (filt_low != filt_mid)) |
| { |
| // Get Low filter error score |
| vp8cx_set_alt_lf_level(cpi, filt_low); |
| vp8_loop_filter_frame_yonly(cm, &cpi->mb.e_mbd, filt_low, 0); |
| cm->last_frame_type = cm->frame_type; |
| cm->last_filter_type = cm->filter_type; |
| cm->last_sharpness_level = cm->sharpness_level; |
| |
| filt_err = vp8_calc_ss_err(sd, cm->frame_to_show, IF_RTCD(&cpi->rtcd.variance)); |
| |
| // Re-instate the unfiltered frame |
| #if HAVE_ARMV7 |
| #if CONFIG_RUNTIME_CPU_DETECT |
| if (cm->rtcd.flags & HAS_NEON) |
| #endif |
| { |
| vp8_yv12_copy_frame_yonly_no_extend_frame_borders_neon(&cpi->last_frame_uf, cm->frame_to_show); |
| } |
| #if CONFIG_RUNTIME_CPU_DETECT |
| else |
| #endif |
| #endif |
| #if !HAVE_ARMV7 || CONFIG_RUNTIME_CPU_DETECT |
| { |
| vp8_yv12_copy_frame_yonly_ptr(&cpi->last_frame_uf, cm->frame_to_show); |
| } |
| #endif |
| |
| // If value is close to the best so far then bias towards a lower loop filter value. |
| if ((filt_err - Bias) < best_err) |
| { |
| // Was it actually better than the previous best? |
| if (filt_err < best_err) |
| best_err = filt_err; |
| |
| filt_best = filt_low; |
| } |
| } |
| |
| // Now look at filt_high |
| if ((filt_direction >= 0) && (filt_high != filt_mid)) |
| { |
| vp8cx_set_alt_lf_level(cpi, filt_high); |
| vp8_loop_filter_frame_yonly(cm, &cpi->mb.e_mbd, filt_high, 0); |
| cm->last_frame_type = cm->frame_type; |
| cm->last_filter_type = cm->filter_type; |
| cm->last_sharpness_level = cm->sharpness_level; |
| |
| filt_err = vp8_calc_ss_err(sd, cm->frame_to_show, IF_RTCD(&cpi->rtcd.variance)); |
| |
| // Re-instate the unfiltered frame |
| #if HAVE_ARMV7 |
| #if CONFIG_RUNTIME_CPU_DETECT |
| if (cm->rtcd.flags & HAS_NEON) |
| #endif |
| { |
| vp8_yv12_copy_frame_yonly_no_extend_frame_borders_neon(&cpi->last_frame_uf, cm->frame_to_show); |
| } |
| #if CONFIG_RUNTIME_CPU_DETECT |
| else |
| #endif |
| #endif |
| #if !HAVE_ARMV7 || CONFIG_RUNTIME_CPU_DETECT |
| { |
| vp8_yv12_copy_frame_yonly_ptr(&cpi->last_frame_uf, cm->frame_to_show); |
| } |
| #endif |
| |
| // Was it better than the previous best? |
| if (filt_err < (best_err - Bias)) |
| { |
| best_err = filt_err; |
| filt_best = filt_high; |
| } |
| } |
| |
| // Half the step distance if the best filter value was the same as last time |
| if (filt_best == filt_mid) |
| { |
| filter_step = filter_step / 2; |
| filt_direction = 0; |
| } |
| else |
| { |
| filt_direction = (filt_best < filt_mid) ? -1 : 1; |
| filt_mid = filt_best; |
| } |
| } |
| |
| cm->filter_level = filt_best; |
| cpi->last_auto_filt_val = filt_best; |
| cpi->last_auto_filt_q = cm->base_qindex; |
| |
| cpi->last_auto_filter_prediction_error = cpi->prediction_error; |
| cpi->frames_since_auto_filter = 0; |
| } |