#include <errno.h>
#include <string.h>
#include <stddef.h>
#include "dict.h"
#include "feature_collector.h"
#include "feature_extractor.h"
#include "feature_name.h"
#include "mem.h"
#include "vif.h"
#include "vif_options.h"
#include "picture_copy.h"
typedef struct VifState {
size_t float_stride;
float *ref;
float *dist;
bool debug;
double vif_enhn_gain_limit;
double vif_kernelscale;
VmafDictionary *feature_name_dict;
} VifState;
static const VmafOption options[] = {
{
.name = "debug",
.help = "debug mode: enable additional output",
.offset = offsetof(VifState, debug),
.type = VMAF_OPT_TYPE_BOOL,
.default_val.b = false,
},
{
.name = "vif_enhn_gain_limit",
.alias = "egl",
.help = "enhancement gain imposed on vif, must be >= 1.0, "
"where 1.0 means the gain is completely disabled",
.offset = offsetof(VifState, vif_enhn_gain_limit),
.type = VMAF_OPT_TYPE_DOUBLE,
.default_val.d = DEFAULT_VIF_ENHN_GAIN_LIMIT,
.min = 1.0,
.max = DEFAULT_VIF_ENHN_GAIN_LIMIT,
.flags = VMAF_OPT_FLAG_FEATURE_PARAM,
},
{
.name = "vif_kernelscale",
.help = "scaling factor for the gaussian kernel (2.0 means "
"multiplying the standard deviation by 2 and enlarge "
"the kernel size accordingly",
.offset = offsetof(VifState, vif_kernelscale),
.type = VMAF_OPT_TYPE_DOUBLE,
.default_val.d = DEFAULT_VIF_KERNELSCALE,
.min = 0.1,
.max = 4.0,
.flags = VMAF_OPT_FLAG_FEATURE_PARAM,
},
{ 0 }
};
static int init(VmafFeatureExtractor *fex, enum VmafPixelFormat pix_fmt,
unsigned bpc, unsigned w, unsigned h)
{
(void)pix_fmt;
(void)bpc;
VifState *s = fex->priv;
s->float_stride = ALIGN_CEIL(w * sizeof(float));
s->ref = aligned_malloc(s->float_stride * h, 32);
if (!s->ref) goto fail;
s->dist = aligned_malloc(s->float_stride * h, 32);
if (!s->dist) goto fail;
s->feature_name_dict =
vmaf_feature_name_dict_from_provided_features(fex->provided_features,
fex->options, s);
if (!s->feature_name_dict) goto fail;
return 0;
fail:
if (s->ref) aligned_free(s->ref);
if (s->dist) aligned_free(s->dist);
vmaf_dictionary_free(&s->feature_name_dict);
return -ENOMEM;
}
static int extract(VmafFeatureExtractor *fex,
VmafPicture *ref_pic, VmafPicture *ref_pic_90,
VmafPicture *dist_pic, VmafPicture *dist_pic_90,
unsigned index, VmafFeatureCollector *feature_collector)
{
VifState *s = fex->priv;
int err = 0;
(void) ref_pic_90;
(void) dist_pic_90;
picture_copy(s->ref, s->float_stride, ref_pic, -128, ref_pic->bpc);
picture_copy(s->dist, s->float_stride, dist_pic, -128, dist_pic->bpc);
double score, score_num, score_den;
double scores[8];
err = compute_vif(s->ref, s->dist, ref_pic->w[0], ref_pic->h[0],
s->float_stride, s->float_stride,
&score, &score_num, &score_den, scores,
s->vif_enhn_gain_limit,
s->vif_kernelscale);
if (err) return err;
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "VMAF_feature_vif_scale0_score",
scores[0] / scores[1], index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "VMAF_feature_vif_scale1_score",
scores[2] / scores[3], index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "VMAF_feature_vif_scale2_score",
scores[4] / scores[5], index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "VMAF_feature_vif_scale3_score",
scores[6] / scores[7], index);
if (!s->debug) return err;
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "vif", score, index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "vif_num", score_num, index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "vif_den", score_den, index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "vif_num_scale0", scores[0], index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "vif_den_scale0", scores[1], index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "vif_num_scale1", scores[2], index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "vif_den_scale1", scores[3], index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "vif_num_scale2", scores[4], index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "vif_den_scale2", scores[5], index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "vif_num_scale3", scores[6], index);
err |= vmaf_feature_collector_append_with_dict(feature_collector,
s->feature_name_dict, "vif_den_scale3", scores[7], index);
return err;
}
static int close(VmafFeatureExtractor *fex)
{
VifState *s = fex->priv;
if (s->ref) aligned_free(s->ref);
if (s->dist) aligned_free(s->dist);
vmaf_dictionary_free(&s->feature_name_dict);
return 0;
}
static const char *provided_features[] = {
"VMAF_feature_vif_scale0_score", "VMAF_feature_vif_scale1_score",
"VMAF_feature_vif_scale2_score", "VMAF_feature_vif_scale3_score",
"vif", "vif_num", "vif_den", "vif_num_scale0", "vif_den_scale0",
"vif_num_scale1", "vif_den_scale1", "vif_num_scale2", "vif_den_scale2",
"vif_num_scale3", "vif_den_scale3",
NULL
};
VmafFeatureExtractor vmaf_fex_float_vif = {
.name = "float_vif",
.init = init,
.extract = extract,
.options = options,
.close = close,
.priv_size = sizeof(VifState),
.provided_features = provided_features,
};