// Copyright (c) Facebook, Inc. and its affiliates.
// All rights reserved.
//
// Copyright 2019 Google LLC
//
// This source code is licensed under the BSD-style license found in the
// LICENSE file in the root directory of this source tree.

#pragma once

#include <gtest/gtest.h>

#include <algorithm>
#include <cassert>
#include <cmath>
#include <cstddef>
#include <cstdint>
#include <cstdlib>
#include <functional>
#include <limits>
#include <memory>
#include <random>
#include <vector>

#include <xnnpack.h>

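// Tester for XNNPACK 2D convolution operators. The builder-style setters
// mirror the parameters of the xnn_create_convolution2d_* functions; each
// Test* method generates random data, computes a reference result, runs the
// operator under test, and verifies the output. Typical usage (parameter
// values below are illustrative only):
//
//   ConvolutionOperatorTester()
//     .input_size(10, 9)
//     .kernel_size(3, 3)
//     .padding(1)
//     .groups(2)
//     .group_input_channels(7)
//     .group_output_channels(13)
//     .iterations(3)
//     .TestNHWCxF32();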
class ConvolutionOperatorTester {
 public:
  inline ConvolutionOperatorTester& padding_tf_same(bool padding_same) {
    if (padding_same) {
      assert(padding_top() == 0);
      assert(padding_left() == 0);
      assert(padding_bottom() == 0);
      assert(padding_right() == 0);
    }
    this->padding_tf_same_ = padding_same;
    return *this;
  }

  inline bool padding_tf_same() const {
    return this->padding_tf_same_;
  }

  inline ConvolutionOperatorTester& padding(uint32_t padding) {
    assert(!padding_tf_same());
    this->padding_top_ = padding;
    this->padding_right_ = padding;
    this->padding_bottom_ = padding;
    this->padding_left_ = padding;
    return *this;
  }

  inline ConvolutionOperatorTester& padding(uint32_t padding_height, uint32_t padding_width) {
    assert(!padding_tf_same());
    this->padding_top_ = padding_height;
    this->padding_right_ = padding_width;
    this->padding_bottom_ = padding_height;
    this->padding_left_ = padding_width;
    return *this;
  }

  inline ConvolutionOperatorTester& padding_height(uint32_t padding_height) {
    assert(!padding_tf_same());
    this->padding_top_ = padding_height;
    this->padding_bottom_ = padding_height;
    return *this;
  }

  inline ConvolutionOperatorTester& padding_width(uint32_t padding_width) {
    assert(!padding_tf_same());
    this->padding_right_ = padding_width;
    this->padding_left_ = padding_width;
    return *this;
  }

  inline ConvolutionOperatorTester& padding_top(uint32_t padding_top) {
    assert(!padding_tf_same());
    this->padding_top_ = padding_top;
    return *this;
  }

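  // With TensorFlow SAME padding, the total padding along each axis is
  // derived from the output, stride, dilated kernel, and input sizes, and is
  // split so that the extra pixel (when the total is odd) goes to the
  // bottom/right, matching TensorFlow's convention.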
  inline uint32_t padding_top() const {
    if (padding_tf_same()) {
      const uint32_t total_padding_height =
        (output_height() - 1) * subsampling_height() + dilated_kernel_height() - input_height();
      return total_padding_height / 2;
    } else {
      return this->padding_top_;
    }
  }

  inline ConvolutionOperatorTester& padding_left(uint32_t padding_left) {
    assert(!padding_tf_same());
    this->padding_left_ = padding_left;
    return *this;
  }

  inline uint32_t padding_left() const {
    if (padding_tf_same()) {
      const uint32_t total_padding_width =
        (output_width() - 1) * subsampling_width() + dilated_kernel_width() - input_width();
      return total_padding_width / 2;
    } else {
      return this->padding_left_;
    }
  }

  inline ConvolutionOperatorTester& padding_bottom(uint32_t padding_bottom) {
    assert(!padding_tf_same());
    this->padding_bottom_ = padding_bottom;
    return *this;
  }

  inline uint32_t padding_bottom() const {
    if (padding_tf_same()) {
      const uint32_t total_padding_height =
        (output_height() - 1) * subsampling_height() + dilated_kernel_height() - input_height();
      return total_padding_height - total_padding_height / 2;
    } else {
      return this->padding_bottom_;
    }
  }

  inline ConvolutionOperatorTester& padding_right(uint32_t padding_right) {
    assert(!padding_tf_same());
    this->padding_right_ = padding_right;
    return *this;
  }

  inline uint32_t padding_right() const {
    if (padding_tf_same()) {
      const uint32_t total_padding_width =
        (output_width() - 1) * subsampling_width() + dilated_kernel_width() - input_width();
      return total_padding_width - total_padding_width / 2;
    } else {
      return this->padding_right_;
    }
  }

  inline ConvolutionOperatorTester& input_size(uint32_t input_height, uint32_t input_width) {
    assert(input_height >= 1);
    assert(input_width >= 1);
    this->input_height_ = input_height;
    this->input_width_ = input_width;
    return *this;
  }

  inline ConvolutionOperatorTester& input_height(uint32_t input_height) {
    assert(input_height >= 1);
    this->input_height_ = input_height;
    return *this;
  }

  inline uint32_t input_height() const {
    return this->input_height_;
  }

  inline ConvolutionOperatorTester& input_width(uint32_t input_width) {
    assert(input_width >= 1);
    this->input_width_ = input_width;
    return *this;
  }

  inline uint32_t input_width() const {
    return this->input_width_;
  }

  inline ConvolutionOperatorTester& groups(uint32_t groups) {
    assert(groups >= 1);
    this->groups_ = groups;
    return *this;
  }

  inline uint32_t groups() const {
    return this->groups_;
  }

  inline ConvolutionOperatorTester& group_input_channels(size_t group_input_channels) {
    assert(group_input_channels >= 1);
    this->group_input_channels_ = group_input_channels;
    return *this;
  }

  inline size_t group_input_channels() const {
    return this->group_input_channels_;
  }

  inline ConvolutionOperatorTester& group_output_channels(size_t group_output_channels) {
    assert(group_output_channels >= 1);
    this->group_output_channels_ = group_output_channels;
    return *this;
  }

  inline size_t group_output_channels() const {
    return this->group_output_channels_;
  }

  inline ConvolutionOperatorTester& batch_size(size_t batch_size) {
    assert(batch_size >= 1);
    this->batch_size_ = batch_size;
    return *this;
  }

  inline size_t batch_size() const {
    return this->batch_size_;
  }

  inline ConvolutionOperatorTester& kernel_size(uint32_t kernel_size) {
    assert(kernel_size >= 1);
    this->kernel_height_ = kernel_size;
    this->kernel_width_ = kernel_size;
    return *this;
  }

  inline ConvolutionOperatorTester& kernel_size(uint32_t kernel_height, uint32_t kernel_width) {
    assert(kernel_height >= 1);
    assert(kernel_width >= 1);
    this->kernel_height_ = kernel_height;
    this->kernel_width_ = kernel_width;
    return *this;
  }

  inline ConvolutionOperatorTester& kernel_height(uint32_t kernel_height) {
    assert(kernel_height >= 1);
    this->kernel_height_ = kernel_height;
    return *this;
  }

  inline uint32_t kernel_height() const {
    return this->kernel_height_;
  }

  inline ConvolutionOperatorTester& kernel_width(uint32_t kernel_width) {
    assert(kernel_width >= 1);
    this->kernel_width_ = kernel_width;
    return *this;
  }

  inline uint32_t kernel_width() const {
    return this->kernel_width_;
  }

  inline ConvolutionOperatorTester& dilation(uint32_t dilation) {
    assert(dilation >= 1);
    this->dilation_height_ = dilation;
    this->dilation_width_ = dilation;
    return *this;
  }

  inline ConvolutionOperatorTester& dilation(uint32_t dilation_height, uint32_t dilation_width) {
    assert(dilation_height >= 1);
    assert(dilation_width >= 1);
    this->dilation_height_ = dilation_height;
    this->dilation_width_ = dilation_width;
    return *this;
  }

  inline ConvolutionOperatorTester& dilation_height(uint32_t dilation_height) {
    assert(dilation_height >= 1);
    this->dilation_height_ = dilation_height;
    return *this;
  }

  inline uint32_t dilation_height() const {
    return this->dilation_height_;
  }

  inline ConvolutionOperatorTester& dilation_width(uint32_t dilation_width) {
    assert(dilation_width >= 1);
    this->dilation_width_ = dilation_width;
    return *this;
  }

  inline uint32_t dilation_width() const {
    return this->dilation_width_;
  }

  inline ConvolutionOperatorTester& subsampling(uint32_t subsampling) {
    assert(subsampling >= 1);
    this->subsampling_height_ = subsampling;
    this->subsampling_width_ = subsampling;
    return *this;
  }

  inline ConvolutionOperatorTester& subsampling(uint32_t subsampling_height, uint32_t subsampling_width) {
    assert(subsampling_height >= 1);
    assert(subsampling_width >= 1);
    this->subsampling_height_ = subsampling_height;
    this->subsampling_width_ = subsampling_width;
    return *this;
  }

  inline ConvolutionOperatorTester& subsampling_height(uint32_t subsampling_height) {
    assert(subsampling_height >= 1);
    this->subsampling_height_ = subsampling_height;
    return *this;
  }

  inline uint32_t subsampling_height() const {
    return this->subsampling_height_;
  }

  inline ConvolutionOperatorTester& subsampling_width(uint32_t subsampling_width) {
    assert(subsampling_width >= 1);
    this->subsampling_width_ = subsampling_width;
    return *this;
  }

  inline uint32_t subsampling_width() const {
    return this->subsampling_width_;
  }

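  // Strides are in elements, not bytes. A value of 0 (the default) means
  // "dense": the pixel stride defaults to groups() times the per-group
  // channel count, and the batch stride to the size of one whole image.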
  inline ConvolutionOperatorTester& input_pixel_stride(size_t input_pixel_stride) {
    assert(input_pixel_stride >= 1);
    this->input_pixel_stride_ = input_pixel_stride;
    return *this;
  }

  inline size_t input_pixel_stride() const {
    if (this->input_pixel_stride_ == 0) {
      return group_input_channels() * groups();
    } else {
      assert(this->input_pixel_stride_ >= group_input_channels() * groups());
      return this->input_pixel_stride_;
    }
  }

  inline ConvolutionOperatorTester& output_pixel_stride(size_t output_pixel_stride) {
    assert(output_pixel_stride >= 1);
    this->output_pixel_stride_ = output_pixel_stride;
    return *this;
  }

  inline size_t output_pixel_stride() const {
    if (this->output_pixel_stride_ == 0) {
      return group_output_channels() * groups();
    } else {
      assert(this->output_pixel_stride_ >= group_output_channels() * groups());
      return this->output_pixel_stride_;
    }
  }

  inline ConvolutionOperatorTester& input_batch_stride(size_t input_batch_stride) {
    assert(input_batch_stride >= 1);
    this->input_batch_stride_ = input_batch_stride;
    return *this;
  }

  inline size_t input_batch_stride() const {
    if (this->input_batch_stride_ == 0) {
      return groups() * group_input_channels() * input_height() * input_width();
    } else {
      assert(this->input_batch_stride_ >= groups() * group_input_channels() * input_height() * input_width());
      return this->input_batch_stride_;
    }
  }

  inline ConvolutionOperatorTester& output_batch_stride(size_t output_batch_stride) {
    assert(output_batch_stride >= 1);
    this->output_batch_stride_ = output_batch_stride;
    return *this;
  }

  inline size_t output_batch_stride() const {
    if (this->output_batch_stride_ == 0) {
      return groups() * group_output_channels() * output_height() * output_width();
    } else {
      assert(this->output_batch_stride_ >= groups() * group_output_channels() * output_height() * output_width());
      return this->output_batch_stride_;
    }
  }

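  // A kernel of size K with dilation D covers a receptive field of
  // (K - 1) * D + 1 input pixels along each axis.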
  inline uint32_t dilated_kernel_height() const {
    return (kernel_height() - 1) * dilation_height() + 1;
  }

  inline uint32_t dilated_kernel_width() const {
    return (kernel_width() - 1) * dilation_width() + 1;
  }

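  // Output size: with TF SAME padding it is ceil(input / stride); otherwise
  // it is (padded_input - dilated_kernel) / stride + 1, clamped below at 1
  // when the dilated kernel does not fit into the padded input.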
  inline size_t output_height() const {
    if (padding_tf_same()) {
      return (input_height() + subsampling_height() - 1) / subsampling_height();
    } else {
      const size_t padded_input_height = padding_top() + input_height() + padding_bottom();
      if (padded_input_height <= dilated_kernel_height()) {
        return 1;
      } else {
        return (padded_input_height - dilated_kernel_height()) / subsampling_height() + 1;
      }
    }
  }

  inline size_t output_width() const {
    if (padding_tf_same()) {
      return (input_width() + subsampling_width() - 1) / subsampling_width();
    } else {
      const size_t padded_input_width = padding_left() + input_width() + padding_right();
      if (padded_input_width <= dilated_kernel_width()) {
        return 1;
      } else {
        return (padded_input_width - dilated_kernel_width()) / subsampling_width() + 1;
      }
    }
  }

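  // The next_* parameters describe the second input shape used by the
  // TestSetup* methods, which set up the same operator twice to verify that
  // it can be resized in place; a value of 0 (the default) reuses the
  // corresponding first-run value.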
  inline ConvolutionOperatorTester& next_input_size(uint32_t next_input_height, uint32_t next_input_width) {
    assert(next_input_height >= 1);
    assert(next_input_width >= 1);
    this->next_input_height_ = next_input_height;
    this->next_input_width_ = next_input_width;
    return *this;
  }

  inline ConvolutionOperatorTester& next_input_height(uint32_t next_input_height) {
    assert(next_input_height >= 1);
    this->next_input_height_ = next_input_height;
    return *this;
  }

  inline uint32_t next_input_height() const {
    if (this->next_input_height_ == 0) {
      return input_height();
    } else {
      return this->next_input_height_;
    }
  }

  inline ConvolutionOperatorTester& next_input_width(uint32_t next_input_width) {
    assert(next_input_width >= 1);
    this->next_input_width_ = next_input_width;
    return *this;
  }

  inline uint32_t next_input_width() const {
    if (this->next_input_width_ == 0) {
      return input_width();
    } else {
      return this->next_input_width_;
    }
  }

  inline size_t next_output_height() const {
    const size_t padded_input_height = padding_top() + next_input_height() + padding_bottom();
    if (padded_input_height <= dilated_kernel_height()) {
      return 1;
    } else {
      return (padded_input_height - dilated_kernel_height()) / subsampling_height() + 1;
    }
  }

  inline size_t next_output_width() const {
    const size_t padded_input_width = padding_left() + next_input_width() + padding_right();
    if (padded_input_width <= dilated_kernel_width()) {
      return 1;
    } else {
      return (padded_input_width - dilated_kernel_width()) / subsampling_width() + 1;
    }
  }

  inline ConvolutionOperatorTester& next_batch_size(size_t next_batch_size) {
    assert(next_batch_size >= 1);
    this->next_batch_size_ = next_batch_size;
    return *this;
  }

  inline size_t next_batch_size() const {
    if (this->next_batch_size_ == 0) {
      return batch_size();
    } else {
      return this->next_batch_size_;
    }
  }

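  // Fraction of kernel elements that TestNCHWxF32() zeroes out, which
  // exercises the sparse-kernel handling of the NCHW convolution path.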
  inline ConvolutionOperatorTester& sparsity(float sparsity) {
    this->sparsity_ = sparsity;
    return *this;
  }

  inline float sparsity() const {
    return this->sparsity_;
  }

  inline ConvolutionOperatorTester& qmin(uint8_t qmin) {
    this->qmin_ = qmin;
    return *this;
  }

  inline uint8_t qmin() const {
    return this->qmin_;
  }

  inline ConvolutionOperatorTester& qmax(uint8_t qmax) {
    this->qmax_ = qmax;
    return *this;
  }

  inline uint8_t qmax() const {
    return this->qmax_;
  }

  inline ConvolutionOperatorTester& force_nhwc_input(bool force_nhwc_input) {
    this->force_nhwc_input_ = force_nhwc_input;
    return *this;
  }

  inline bool force_nhwc_input() const {
    return this->force_nhwc_input_;
  }

  inline ConvolutionOperatorTester& depthwise_layout(bool depthwise_layout) {
    this->depthwise_layout_ = depthwise_layout;
    return *this;
  }

  inline bool depthwise_layout() const {
    return this->depthwise_layout_;
  }

  inline ConvolutionOperatorTester& has_bias(bool has_bias) {
    this->has_bias_ = has_bias;
    return *this;
  }

  inline bool has_bias() const {
    return this->has_bias_;
  }

  inline ConvolutionOperatorTester& iterations(size_t iterations) {
    this->iterations_ = iterations;
    return *this;
  }

  inline size_t iterations() const {
    return this->iterations_;
  }

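  // Tests the quantized (Q8) NHWC convolution: accumulates a reference
  // result in int32, derives requantization parameters from the observed
  // accumulator range, and checks the operator output against the
  // renormalized reference within 0.9 of a quantization step. Out-of-bounds
  // kernel taps are skipped via unsigned wrap-around: a "negative" iy/ix
  // underflows to a huge size_t and fails the bounds check.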
  void TestNHWCxQ8() const {
    std::random_device random_device;
    auto rng = std::mt19937(random_device());
    auto s32rng = std::bind(std::uniform_int_distribution<int32_t>(-10000, 10000), rng);
    auto u8rng = std::bind(std::uniform_int_distribution<uint32_t>(0, std::numeric_limits<uint8_t>::max()), rng);

    std::vector<uint8_t> input(XNN_EXTRA_BYTES / sizeof(uint8_t) +
      batch_size() * ((input_height() * input_width() - 1) * input_pixel_stride() + groups() * group_input_channels()) + 8);
    std::vector<uint8_t> kernel(groups() * group_output_channels() * kernel_height() * kernel_width() * group_input_channels());
    std::vector<int32_t> bias(groups() * group_output_channels());
    std::vector<uint8_t> output(batch_size() * ((output_height() * output_width() - 1) * output_pixel_stride() + groups() * group_output_channels()));
    std::vector<int32_t> accumulators(batch_size() * output_height() * output_width() * groups() * group_output_channels());
    std::vector<double> output_ref(batch_size() * output_height() * output_width() * groups() * group_output_channels());

    const uint8_t input_zero_point = 127;
    const uint8_t kernel_zero_point = 127;

    for (size_t iteration = 0; iteration < iterations(); iteration++) {
      std::generate(input.begin(), input.end(), std::ref(u8rng));
      std::generate(kernel.begin(), kernel.end(), std::ref(u8rng));
      std::generate(bias.begin(), bias.end(), std::ref(s32rng));
      std::fill(output.begin(), output.end(), 0xA5);

      // Compute reference results, without renormalization.
      if (has_bias()) {
        for (size_t i = 0; i < batch_size(); i++) {
          for (size_t oy = 0; oy < output_height(); oy++) {
            for (size_t ox = 0; ox < output_width(); ox++) {
              for (size_t g = 0; g < groups(); g++) {
                for (size_t oc = 0; oc < group_output_channels(); oc++) {
                  accumulators[(((i * output_height() + oy) * output_width() + ox) * groups() + g) * group_output_channels() + oc] =
                    bias[g * group_output_channels() + oc];
                }
              }
            }
          }
        }
      } else {
        std::fill(accumulators.begin(), accumulators.end(), 0);
      }
      if (depthwise_layout()) {
        ASSERT_EQ(group_input_channels(), 1);

        for (size_t i = 0; i < batch_size(); i++) {
          for (size_t oy = 0; oy < output_height(); oy++) {
            for (size_t ox = 0; ox < output_width(); ox++) {
              for (size_t ky = 0; ky < kernel_height(); ky++) {
                const size_t iy = oy * subsampling_height() + ky * dilation_height() - padding_top();
                if (iy < input_height()) {
                  for (size_t kx = 0; kx < kernel_width(); kx++) {
                    const size_t ix = ox * subsampling_width() + kx * dilation_width() - padding_left();
                    if (ix < input_width()) {
                      for (size_t g = 0; g < groups(); g++) {
                        for (size_t oc = 0; oc < group_output_channels(); oc++) {
                          accumulators[(((i * output_height() + oy) * output_width() + ox) * groups() + g) * group_output_channels() + oc] +=
                            (int32_t(input[((i * input_height() + iy) * input_width() + ix) * input_pixel_stride() + g]) - int32_t(input_zero_point)) *
                            (int32_t(kernel[((ky * kernel_width() + kx) * groups() + g) * group_output_channels() + oc]) - int32_t(kernel_zero_point));
                        }
                      }
                    }
                  }
                }
              }
            }
          }
        }
      } else {
        for (size_t i = 0; i < batch_size(); i++) {
          for (size_t oy = 0; oy < output_height(); oy++) {
            for (size_t ox = 0; ox < output_width(); ox++) {
              for (size_t ky = 0; ky < kernel_height(); ky++) {
                const size_t iy = oy * subsampling_height() + ky * dilation_height() - padding_top();
                if (iy < input_height()) {
                  for (size_t kx = 0; kx < kernel_width(); kx++) {
                    const size_t ix = ox * subsampling_width() + kx * dilation_width() - padding_left();
                    if (ix < input_width()) {
                      for (size_t g = 0; g < groups(); g++) {
                        for (size_t oc = 0; oc < group_output_channels(); oc++) {
                          for (size_t ic = 0; ic < group_input_channels(); ic++) {
                            accumulators[(((i * output_height() + oy) * output_width() + ox) * groups() + g) * group_output_channels() + oc] +=
                              (int32_t(input[((i * input_height() + iy) * input_width() + ix) * input_pixel_stride() + g * group_input_channels() + ic]) - int32_t(input_zero_point)) *
                              (int32_t(kernel[(((g * group_output_channels() + oc) * kernel_height() + ky) * kernel_width() + kx) * group_input_channels() + ic]) - int32_t(kernel_zero_point));
                          }
                        }
                      }
                    }
                  }
                }
              }
            }
          }
        }
      }

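      // The output scale maps the full accumulator range onto the 255 levels
      // of a uint8, and the zero point centers that range; both are derived
      // from the data rather than fixed so each test case exercises a
      // realistic requantization.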
      // Compute renormalization parameters.
      const int32_t accumulated_min = *std::min_element(accumulators.cbegin(), accumulators.cend());
      const int32_t accumulated_max = *std::max_element(accumulators.cbegin(), accumulators.cend());

      const double output_scale = double(uint32_t(accumulated_max - accumulated_min)) / 255.0;
      const uint8_t output_zero_point = uint8_t(std::max(std::min(
        lrint(127.5 - 0.5 * double(accumulated_min + accumulated_max) / output_scale),
        long(std::numeric_limits<uint8_t>::max())), long(std::numeric_limits<uint8_t>::min())));

      // Renormalize reference results.
      std::transform(accumulators.cbegin(), accumulators.cend(), output_ref.begin(),
        [this, output_scale, output_zero_point](int32_t x) -> double {
          return std::max<double>(std::min<double>(double(x) / output_scale, double(qmax()) - output_zero_point), double(qmin()) - output_zero_point);
        });

      // Create, setup, run, and destroy Convolution operator.
      ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
      xnn_operator_t convolution_op = nullptr;

      ASSERT_EQ(xnn_status_success,
        xnn_create_convolution2d_nhwc_q8(
          padding_tf_same() ? 0 : padding_top(), padding_tf_same() ? 0 : padding_right(),
          padding_tf_same() ? 0 : padding_bottom(), padding_tf_same() ? 0 : padding_left(),
          kernel_height(), kernel_width(),
          subsampling_height(), subsampling_width(),
          dilation_height(), dilation_width(),
          groups(), group_input_channels(), group_output_channels(),
          input_pixel_stride(), output_pixel_stride(),
          input_zero_point, 1.0f /* input scale */,
          kernel_zero_point, 1.0f /* kernel scale */,
          kernel.data(), has_bias() ? bias.data() : nullptr,
          output_zero_point, output_scale, qmin(), qmax(),
          (depthwise_layout() ? XNN_FLAG_DEPTHWISE_CONVOLUTION : 0) | (padding_tf_same() ? XNN_FLAG_TENSORFLOW_SAME_PADDING : 0),
          &convolution_op));

      // Smart pointer to automatically delete convolution_op.
      std::unique_ptr<xnn_operator, decltype(&xnn_delete_operator)> auto_convolution_op(convolution_op, xnn_delete_operator);

      ASSERT_EQ(xnn_status_success,
        xnn_setup_convolution2d_nhwc_q8(
          convolution_op,
          batch_size(), input_height(), input_width(),
          input.data(), output.data(),
          nullptr /* thread pool */));

      ASSERT_EQ(xnn_status_success,
        xnn_run_operator(convolution_op, nullptr /* thread pool */));

      // Verify results.
      for (size_t i = 0; i < batch_size(); i++) {
        for (size_t y = 0; y < output_height(); y++) {
          for (size_t x = 0; x < output_width(); x++) {
            for (size_t g = 0; g < groups(); g++) {
              for (size_t c = 0; c < group_output_channels(); c++) {
                ASSERT_LE(int32_t(output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c]), int32_t(qmax()))
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_GE(int32_t(output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c]), int32_t(qmin()))
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_NEAR(
                  output_ref[(((i * output_height() + y) * output_width() + x) * groups() + g) * group_output_channels() + c],
                  double(output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c]) - double(output_zero_point),
                  0.9)
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
              }
            }
          }
        }
      }
    }
  }

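  // Tests the single-precision NHWC convolution. qmin()/qmax() control how
  // aggressively the output is clamped: the clamping bounds are placed at
  // the qmin/qmax fractions (out of 255) of the observed reference range.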
  void TestNHWCxF32() const {
    std::random_device random_device;
    auto rng = std::mt19937(random_device());
    auto f32rng = std::bind(std::uniform_real_distribution<float>(0.1f, 1.0f), rng);

    std::vector<float> input(XNN_EXTRA_BYTES / sizeof(float) +
      batch_size() * ((input_height() * input_width() - 1) * input_pixel_stride() + groups() * group_input_channels()));
    std::vector<float> kernel(groups() * group_output_channels() * kernel_height() * kernel_width() * group_input_channels());
    std::vector<float> bias(groups() * group_output_channels());
    std::vector<float> output(batch_size() * ((output_height() * output_width() - 1) * output_pixel_stride() + groups() * group_output_channels()));
    std::vector<float> output_ref(batch_size() * output_height() * output_width() * groups() * group_output_channels());

    for (size_t iteration = 0; iteration < iterations(); iteration++) {
      std::generate(input.begin(), input.end(), std::ref(f32rng));
      std::generate(kernel.begin(), kernel.end(), std::ref(f32rng));
      std::generate(bias.begin(), bias.end(), std::ref(f32rng));
      std::fill(output.begin(), output.end(), nanf(""));

      // Compute reference results, without clamping.
      if (has_bias()) {
        for (size_t i = 0; i < batch_size(); i++) {
          for (size_t oy = 0; oy < output_height(); oy++) {
            for (size_t ox = 0; ox < output_width(); ox++) {
              for (size_t g = 0; g < groups(); g++) {
                for (size_t oc = 0; oc < group_output_channels(); oc++) {
                  output_ref[(((i * output_height() + oy) * output_width() + ox) * groups() + g) * group_output_channels() + oc] =
                    bias[g * group_output_channels() + oc];
                }
              }
            }
          }
        }
      } else {
        std::fill(output_ref.begin(), output_ref.end(), 0.0f);
      }
      if (depthwise_layout()) {
        ASSERT_EQ(group_input_channels(), 1);

        for (size_t i = 0; i < batch_size(); i++) {
          for (size_t oy = 0; oy < output_height(); oy++) {
            for (size_t ox = 0; ox < output_width(); ox++) {
              for (size_t ky = 0; ky < kernel_height(); ky++) {
                const size_t iy = oy * subsampling_height() + ky * dilation_height() - padding_top();
                if (iy < input_height()) {
                  for (size_t kx = 0; kx < kernel_width(); kx++) {
                    const size_t ix = ox * subsampling_width() + kx * dilation_width() - padding_left();
                    if (ix < input_width()) {
                      for (size_t g = 0; g < groups(); g++) {
                        for (size_t oc = 0; oc < group_output_channels(); oc++) {
                          output_ref[(((i * output_height() + oy) * output_width() + ox) * groups() + g) * group_output_channels() + oc] +=
                            input[((i * input_height() + iy) * input_width() + ix) * input_pixel_stride() + g] *
                            kernel[((ky * kernel_width() + kx) * groups() + g) * group_output_channels() + oc];
                        }
                      }
                    }
                  }
                }
              }
            }
          }
        }
      } else {
        for (size_t i = 0; i < batch_size(); i++) {
          for (size_t oy = 0; oy < output_height(); oy++) {
            for (size_t ox = 0; ox < output_width(); ox++) {
              for (size_t ky = 0; ky < kernel_height(); ky++) {
                const size_t iy = oy * subsampling_height() + ky * dilation_height() - padding_top();
                if (iy < input_height()) {
                  for (size_t kx = 0; kx < kernel_width(); kx++) {
                    const size_t ix = ox * subsampling_width() + kx * dilation_width() - padding_left();
                    if (ix < input_width()) {
                      for (size_t g = 0; g < groups(); g++) {
                        for (size_t oc = 0; oc < group_output_channels(); oc++) {
                          for (size_t ic = 0; ic < group_input_channels(); ic++) {
                            output_ref[(((i * output_height() + oy) * output_width() + ox) * groups() + g) * group_output_channels() + oc] +=
                              input[((i * input_height() + iy) * input_width() + ix) * input_pixel_stride() + g * group_input_channels() + ic] *
                              kernel[(((g * group_output_channels() + oc) * kernel_height() + ky) * kernel_width() + kx) * group_input_channels() + ic];
                          }
                        }
                      }
                    }
                  }
                }
              }
            }
          }
        }
      }

      // Compute clamping parameters.
      const float accumulated_min = *std::min_element(output_ref.cbegin(), output_ref.cend());
      const float accumulated_max = *std::max_element(output_ref.cbegin(), output_ref.cend());

      const float output_min = accumulated_min + (accumulated_max - accumulated_min) / 255.0f * float(qmin());
      const float output_max = accumulated_max - (accumulated_max - accumulated_min) / 255.0f * float(255 - qmax());

      // Clamp reference results.
      for (float& value : output_ref) {
        value = std::max(std::min(value, output_max), output_min);
      }

      // Create, setup, run, and destroy Convolution operator.
      ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
      xnn_operator_t convolution_op = nullptr;

      ASSERT_EQ(xnn_status_success,
        xnn_create_convolution2d_nhwc_f32(
          padding_tf_same() ? 0 : padding_top(), padding_tf_same() ? 0 : padding_right(),
          padding_tf_same() ? 0 : padding_bottom(), padding_tf_same() ? 0 : padding_left(),
          kernel_height(), kernel_width(),
          subsampling_height(), subsampling_width(),
          dilation_height(), dilation_width(),
          groups(), group_input_channels(), group_output_channels(),
          input_pixel_stride(), output_pixel_stride(),
          kernel.data(), has_bias() ? bias.data() : nullptr,
          output_min, output_max,
          (depthwise_layout() ? XNN_FLAG_DEPTHWISE_CONVOLUTION : 0) | (padding_tf_same() ? XNN_FLAG_TENSORFLOW_SAME_PADDING : 0),
          &convolution_op));

      // Smart pointer to automatically delete convolution_op.
      std::unique_ptr<xnn_operator, decltype(&xnn_delete_operator)> auto_convolution_op(convolution_op, xnn_delete_operator);

      ASSERT_EQ(xnn_status_success,
        xnn_setup_convolution2d_nhwc_f32(
          convolution_op,
          batch_size(), input_height(), input_width(),
          input.data(), output.data(),
          nullptr /* thread pool */));

      ASSERT_EQ(xnn_status_success,
        xnn_run_operator(convolution_op, nullptr /* thread pool */));

      // Verify results.
      for (size_t i = 0; i < batch_size(); i++) {
        for (size_t y = 0; y < output_height(); y++) {
          for (size_t x = 0; x < output_width(); x++) {
            for (size_t g = 0; g < groups(); g++) {
              for (size_t c = 0; c < group_output_channels(); c++) {
                ASSERT_GE(output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c], output_min)
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_LE(output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c], output_max)
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_NEAR(
                  output_ref[(((i * output_height() + y) * output_width() + x) * groups() + g) * group_output_channels() + c],
                  output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c],
                  1.0e-4 * std::abs(output_ref[(((i * output_height() + y) * output_width() + x) * groups() + g) * group_output_channels() + c]))
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
              }
            }
          }
        }
      }
    }
  }

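  // Tests the single-precision NCHW convolution, optionally with a
  // sparsified kernel (see sparsity()) and optionally with NHWC input
  // (XNN_FLAG_INPUT_NHWC). Parameter combinations that the NCHW path does
  // not support are skipped rather than failed.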
  void TestNCHWxF32() const {
    ASSERT_FALSE(depthwise_layout());

    std::random_device random_device;
    auto rng = std::mt19937(random_device());
    auto f32rng = std::bind(std::uniform_real_distribution<float>(0.1f, 1.0f), rng);
    auto prng = std::bind(std::uniform_real_distribution<float>(), rng);

    std::vector<float> input(XNN_EXTRA_BYTES / sizeof(float) +
      batch_size() * input_batch_stride() + groups() * group_input_channels() * input_height() * input_width());
    std::vector<float> kernel(
      groups() * group_output_channels() * kernel_height() * kernel_width() * group_input_channels());
    std::vector<float> bias(groups() * group_output_channels());
    std::vector<float> output(
      batch_size() * output_batch_stride() + groups() * group_output_channels() * output_height() * output_width());
    std::vector<float> output_ref(batch_size() * groups() * group_output_channels() * output_height() * output_width());

    for (size_t iteration = 0; iteration < iterations(); iteration++) {
      std::generate(input.begin(), input.end(), std::ref(f32rng));
      std::generate(kernel.begin(), kernel.end(), std::ref(f32rng));
      for (float& k : kernel) {
        if (prng() <= sparsity()) {
          k = 0.0f;
        }
      }
      std::generate(bias.begin(), bias.end(), std::ref(f32rng));
      std::fill(output.begin(), output.end(), nanf(""));

      // Compute reference results, without clamping.
      if (has_bias()) {
        for (size_t i = 0; i < batch_size(); i++) {
          for (size_t oy = 0; oy < output_height(); oy++) {
            for (size_t ox = 0; ox < output_width(); ox++) {
              for (size_t g = 0; g < groups(); g++) {
                for (size_t oc = 0; oc < group_output_channels(); oc++) {
                  output_ref[(((i * groups() + g) * group_output_channels() + oc) * output_height() + oy) * output_width() + ox] =
                    bias[g * group_output_channels() + oc];
                }
              }
            }
          }
        }
      } else {
        std::fill(output_ref.begin(), output_ref.end(), 0.0f);
      }
      if (force_nhwc_input()) {
        for (size_t i = 0; i < batch_size(); i++) {
          for (size_t oy = 0; oy < output_height(); oy++) {
            for (size_t ox = 0; ox < output_width(); ox++) {
              for (size_t ky = 0; ky < kernel_height(); ky++) {
                const size_t iy = oy * subsampling_height() + ky * dilation_height() - padding_top();
                if (iy < input_height()) {
                  for (size_t kx = 0; kx < kernel_width(); kx++) {
                    const size_t ix = ox * subsampling_width() + kx * dilation_width() - padding_left();
                    if (ix < input_width()) {
                      for (size_t g = 0; g < groups(); g++) {
                        for (size_t oc = 0; oc < group_output_channels(); oc++) {
                          for (size_t ic = 0; ic < group_input_channels(); ic++) {
                            output_ref[(((i * groups() + g) * group_output_channels() + oc) * output_height() + oy) * output_width() + ox] +=
                              input[((((i * input_height() + iy) * input_width() + ix) * groups() + g) * group_input_channels() + ic)] *
                              kernel[(((g * group_output_channels() + oc) * kernel_height() + ky) * kernel_width() + kx) * group_input_channels() + ic];
                          }
                        }
                      }
                    }
                  }
                }
              }
            }
          }
        }
      } else {
        for (size_t i = 0; i < batch_size(); i++) {
          for (size_t oy = 0; oy < output_height(); oy++) {
            for (size_t ox = 0; ox < output_width(); ox++) {
              for (size_t ky = 0; ky < kernel_height(); ky++) {
                const size_t iy = oy * subsampling_height() + ky * dilation_height() - padding_top();
                if (iy < input_height()) {
                  for (size_t kx = 0; kx < kernel_width(); kx++) {
                    const size_t ix = ox * subsampling_width() + kx * dilation_width() - padding_left();
                    if (ix < input_width()) {
                      for (size_t g = 0; g < groups(); g++) {
                        for (size_t oc = 0; oc < group_output_channels(); oc++) {
                          for (size_t ic = 0; ic < group_input_channels(); ic++) {
                            output_ref[(((i * groups() + g) * group_output_channels() + oc) * output_height() + oy) * output_width() + ox] +=
                              input[i * input_batch_stride() +
                                ((g * group_input_channels() + ic) * input_height() + iy) * input_width() + ix] *
                              kernel[(((g * group_output_channels() + oc) * kernel_height() + ky) * kernel_width() + kx) * group_input_channels() + ic];
                          }
                        }
                      }
                    }
                  }
                }
              }
            }
          }
        }
      }

      // Compute clamping parameters.
      const float accumulated_min = *std::min_element(output_ref.cbegin(), output_ref.cend());
      const float accumulated_max = *std::max_element(output_ref.cbegin(), output_ref.cend());

      const float output_min = qmin() == 0 ? -std::numeric_limits<float>::infinity() :
        accumulated_min + (accumulated_max - accumulated_min) / 255.0f * float(qmin());
      const float output_max = qmax() == 255 ? std::numeric_limits<float>::infinity() :
        accumulated_max - (accumulated_max - accumulated_min) / 255.0f * float(255 - qmax());

      // Clamp reference results.
      for (float& value : output_ref) {
        value = std::max(std::min(value, output_max), output_min);
      }

      // Create, setup, run, and destroy Convolution operator.
      ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
      xnn_operator_t convolution_op = nullptr;

      xnn_status status = xnn_create_convolution2d_nchw_f32(
        padding_top(), padding_right(), padding_bottom(), padding_left(),
        kernel_height(), kernel_width(),
        subsampling_height(), subsampling_width(),
        dilation_height(), dilation_width(),
        groups(), group_input_channels(), group_output_channels(),
        kernel.data(), has_bias() ? bias.data() : nullptr,
        output_min, output_max,
        (depthwise_layout() ? XNN_FLAG_DEPTHWISE_CONVOLUTION : 0) | (force_nhwc_input() ? XNN_FLAG_INPUT_NHWC : 0),
        &convolution_op);
      if (status == xnn_status_unsupported_parameter) {
        GTEST_SKIP();
      }
      ASSERT_EQ(xnn_status_success, status);

      // Smart pointer to automatically delete convolution_op.
      std::unique_ptr<xnn_operator, decltype(&xnn_delete_operator)> auto_convolution_op(convolution_op, xnn_delete_operator);

      ASSERT_EQ(xnn_status_success,
        xnn_setup_convolution2d_nchw_f32(
          convolution_op,
          batch_size(), input_batch_stride(), output_batch_stride(), input_height(), input_width(),
          input.data(), output.data(),
          nullptr /* thread pool */));

      ASSERT_EQ(xnn_status_success,
        xnn_run_operator(convolution_op, nullptr /* thread pool */));

      // Verify results.
      for (size_t i = 0; i < batch_size(); i++) {
        for (size_t y = 0; y < output_height(); y++) {
          for (size_t x = 0; x < output_width(); x++) {
            for (size_t g = 0; g < groups(); g++) {
              for (size_t c = 0; c < group_output_channels(); c++) {
                ASSERT_GE(output[i * output_batch_stride() + ((g * group_output_channels() + c) * output_height() + y) * output_width() + x], output_min)
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c << ", image = " << i;
                ASSERT_LE(output[i * output_batch_stride() + ((g * group_output_channels() + c) * output_height() + y) * output_width() + x], output_max)
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c << ", image = " << i;
                ASSERT_NEAR(
                  output_ref[(((i * groups() + g) * group_output_channels() + c) * output_height() + y) * output_width() + x],
                  output[i * output_batch_stride() + ((g * group_output_channels() + c) * output_height() + y) * output_width() + x],
                  1.0e-4 * std::abs(output_ref[(((i * groups() + g) * group_output_channels() + c) * output_height() + y) * output_width() + x]))
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c << ", image = " << i;
              }
            }
          }
        }
      }
    }
  }

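  // Tests that a Q8 NHWC convolution operator can be set up a second time
  // with a different batch size and input shape: run and verify once, then
  // re-setup the same operator with the next_* shape and verify again.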
  void TestSetupNHWCxQ8() const {
    ASSERT_FALSE(depthwise_layout());

    std::random_device random_device;
    auto rng = std::mt19937(random_device());
    auto s32rng = std::bind(std::uniform_int_distribution<int32_t>(-10000, 10000), rng);
    auto u8rng = std::bind(std::uniform_int_distribution<uint32_t>(0, std::numeric_limits<uint8_t>::max()), rng);

    std::vector<uint8_t> input(XNN_EXTRA_BYTES / sizeof(uint8_t) + std::max(
      batch_size() * ((input_height() * input_width() - 1) * input_pixel_stride() + groups() * group_input_channels()),
      next_batch_size() * ((next_input_height() * next_input_width() - 1) * input_pixel_stride() + groups() * group_input_channels())) + 8);
    std::vector<uint8_t> kernel(groups() * group_output_channels() * kernel_height() * kernel_width() * group_input_channels());
    std::vector<int32_t> bias(groups() * group_output_channels());
    std::vector<uint8_t> output(std::max(
      batch_size() * ((output_height() * output_width() - 1) * output_pixel_stride() + groups() * group_output_channels()),
      next_batch_size() * ((next_output_height() * next_output_width() - 1) * output_pixel_stride() + groups() * group_output_channels())));
    std::vector<int32_t> accumulators(batch_size() * output_height() * output_width() * groups() * group_output_channels());
    std::vector<double> output_ref(batch_size() * output_height() * output_width() * groups() * group_output_channels());
    std::vector<int32_t> next_accumulators(next_batch_size() * next_output_height() * next_output_width() * groups() * group_output_channels());
    std::vector<double> next_output_ref(next_batch_size() * next_output_height() * next_output_width() * groups() * group_output_channels());

    const uint8_t input_zero_point = 127;
    const uint8_t kernel_zero_point = 127;

    for (size_t iteration = 0; iteration < iterations(); iteration++) {
      std::generate(input.begin(), input.end(), std::ref(u8rng));
      std::generate(kernel.begin(), kernel.end(), std::ref(u8rng));
      std::generate(bias.begin(), bias.end(), std::ref(s32rng));
      std::fill(output.begin(), output.end(), 0xA5);

      // Compute reference results, without renormalization.
      if (has_bias()) {
        for (size_t i = 0; i < batch_size(); i++) {
          for (size_t oy = 0; oy < output_height(); oy++) {
            for (size_t ox = 0; ox < output_width(); ox++) {
              for (size_t g = 0; g < groups(); g++) {
                for (size_t oc = 0; oc < group_output_channels(); oc++) {
                  accumulators[(((i * output_height() + oy) * output_width() + ox) * groups() + g) * group_output_channels() + oc] =
                    bias[g * group_output_channels() + oc];
                }
              }
            }
          }
        }
      } else {
        std::fill(accumulators.begin(), accumulators.end(), 0);
      }
      for (size_t i = 0; i < batch_size(); i++) {
        for (size_t oy = 0; oy < output_height(); oy++) {
          for (size_t ox = 0; ox < output_width(); ox++) {
            for (size_t ky = 0; ky < kernel_height(); ky++) {
              const size_t iy = oy * subsampling_height() + ky * dilation_height() - padding_top();
              if (iy < input_height()) {
                for (size_t kx = 0; kx < kernel_width(); kx++) {
                  const size_t ix = ox * subsampling_width() + kx * dilation_width() - padding_left();
                  if (ix < input_width()) {
                    for (size_t g = 0; g < groups(); g++) {
                      for (size_t oc = 0; oc < group_output_channels(); oc++) {
                        for (size_t ic = 0; ic < group_input_channels(); ic++) {
                          accumulators[(((i * output_height() + oy) * output_width() + ox) * groups() + g) * group_output_channels() + oc] +=
                            (int32_t(input[((i * input_height() + iy) * input_width() + ix) * input_pixel_stride() + g * group_input_channels() + ic]) - int32_t(input_zero_point)) *
                            (int32_t(kernel[(((g * group_output_channels() + oc) * kernel_height() + ky) * kernel_width() + kx) * group_input_channels() + ic]) - int32_t(kernel_zero_point));
                        }
                      }
                    }
                  }
                }
              }
            }
          }
        }
      }

      // Compute renormalization parameters.
      const int32_t accumulated_min = *std::min_element(accumulators.cbegin(), accumulators.cend());
      const int32_t accumulated_max = *std::max_element(accumulators.cbegin(), accumulators.cend());

      const double output_scale = double(uint32_t(accumulated_max - accumulated_min)) / 255.0;
      const uint8_t output_zero_point = uint8_t(std::max(std::min(
        lrint(127.5 - 0.5 * double(accumulated_min + accumulated_max) / output_scale),
        long(std::numeric_limits<uint8_t>::max())), long(std::numeric_limits<uint8_t>::min())));

      // Renormalize reference results.
      std::transform(accumulators.cbegin(), accumulators.cend(), output_ref.begin(),
        [this, output_scale, output_zero_point](int32_t x) -> double {
          return std::max<double>(std::min<double>(double(x) / output_scale, double(qmax()) - output_zero_point), double(qmin()) - output_zero_point);
        });

      // Create, setup, and run Convolution operator once.
      ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
      xnn_operator_t convolution_op = nullptr;

      ASSERT_EQ(xnn_status_success,
        xnn_create_convolution2d_nhwc_q8(
          padding_top(), padding_right(), padding_bottom(), padding_left(),
          kernel_height(), kernel_width(),
          subsampling_height(), subsampling_width(),
          dilation_height(), dilation_width(),
          groups(), group_input_channels(), group_output_channels(),
          input_pixel_stride(), output_pixel_stride(),
          input_zero_point, 1.0f /* input scale */,
          kernel_zero_point, 1.0f /* kernel scale */,
          kernel.data(), has_bias() ? bias.data() : nullptr,
          output_zero_point, output_scale, qmin(), qmax(),
          0, &convolution_op));

      // Smart pointer to automatically delete convolution_op.
      std::unique_ptr<xnn_operator, decltype(&xnn_delete_operator)> auto_convolution_op(convolution_op, xnn_delete_operator);

      ASSERT_EQ(xnn_status_success,
        xnn_setup_convolution2d_nhwc_q8(
          convolution_op,
          batch_size(), input_height(), input_width(),
          input.data(), output.data(),
          nullptr /* thread pool */));

      ASSERT_EQ(xnn_status_success,
        xnn_run_operator(convolution_op, nullptr /* thread pool */));

      // Verify results of the first run.
      for (size_t i = 0; i < batch_size(); i++) {
        for (size_t y = 0; y < output_height(); y++) {
          for (size_t x = 0; x < output_width(); x++) {
            for (size_t g = 0; g < groups(); g++) {
              for (size_t c = 0; c < group_output_channels(); c++) {
                ASSERT_LE(int32_t(output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c]), int32_t(qmax()))
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_GE(int32_t(output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c]), int32_t(qmin()))
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_NEAR(
                  output_ref[(((i * output_height() + y) * output_width() + x) * groups() + g) * group_output_channels() + c],
                  double(output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c]) - double(output_zero_point),
                  0.9)
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
              }
            }
          }
        }
      }

      // Re-generate data for the second run.
      std::generate(input.begin(), input.end(), std::ref(u8rng));
      std::fill(output.begin(), output.end(), 0xA5);

      // Compute reference results for the second run, including renormalization.
      if (has_bias()) {
        for (size_t i = 0; i < next_batch_size(); i++) {
          for (size_t oy = 0; oy < next_output_height(); oy++) {
            for (size_t ox = 0; ox < next_output_width(); ox++) {
              for (size_t g = 0; g < groups(); g++) {
                for (size_t oc = 0; oc < group_output_channels(); oc++) {
                  next_accumulators[(((i * next_output_height() + oy) * next_output_width() + ox) * groups() + g) * group_output_channels() + oc] =
                    bias[g * group_output_channels() + oc];
                }
              }
            }
          }
        }
      } else {
        std::fill(next_accumulators.begin(), next_accumulators.end(), 0);
      }
      for (size_t i = 0; i < next_batch_size(); i++) {
        for (size_t oy = 0; oy < next_output_height(); oy++) {
          for (size_t ox = 0; ox < next_output_width(); ox++) {
            for (size_t ky = 0; ky < kernel_height(); ky++) {
              const size_t iy = oy * subsampling_height() + ky * dilation_height() - padding_top();
              if (iy < next_input_height()) {
                for (size_t kx = 0; kx < kernel_width(); kx++) {
                  const size_t ix = ox * subsampling_width() + kx * dilation_width() - padding_left();
                  if (ix < next_input_width()) {
                    for (size_t g = 0; g < groups(); g++) {
                      for (size_t oc = 0; oc < group_output_channels(); oc++) {
                        for (size_t ic = 0; ic < group_input_channels(); ic++) {
                          next_accumulators[(((i * next_output_height() + oy) * next_output_width() + ox) * groups() + g) * group_output_channels() + oc] +=
                            (int32_t(input[((i * next_input_height() + iy) * next_input_width() + ix) * input_pixel_stride() + g * group_input_channels() + ic]) - int32_t(input_zero_point)) *
                            (int32_t(kernel[(((g * group_output_channels() + oc) * kernel_height() + ky) * kernel_width() + kx) * group_input_channels() + ic]) - int32_t(kernel_zero_point));
                        }
                      }
                    }
                  }
                }
              }
            }
          }
        }
      }
      std::transform(next_accumulators.cbegin(), next_accumulators.cend(), next_output_ref.begin(),
        [this, output_scale, output_zero_point](int32_t x) -> double {
          return std::max<double>(std::min<double>(double(x) / output_scale, double(qmax()) - output_zero_point), double(qmin()) - output_zero_point);
        });

      // Setup and run Convolution operator the second time, and destroy the operator.
      ASSERT_EQ(xnn_status_success,
        xnn_setup_convolution2d_nhwc_q8(
          convolution_op,
          next_batch_size(), next_input_height(), next_input_width(),
          input.data(), output.data(),
          nullptr /* thread pool */));

      ASSERT_EQ(xnn_status_success,
        xnn_run_operator(convolution_op, nullptr /* thread pool */));

      // Verify results of the second run.
      for (size_t i = 0; i < next_batch_size(); i++) {
        for (size_t y = 0; y < next_output_height(); y++) {
          for (size_t x = 0; x < next_output_width(); x++) {
            for (size_t g = 0; g < groups(); g++) {
              for (size_t c = 0; c < group_output_channels(); c++) {
                ASSERT_LE(int32_t(output[((i * next_output_height() + y) * next_output_width() + x) * output_pixel_stride() + g * group_output_channels() + c]), int32_t(qmax()))
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_GE(int32_t(output[((i * next_output_height() + y) * next_output_width() + x) * output_pixel_stride() + g * group_output_channels() + c]), int32_t(qmin()))
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_NEAR(
                  next_output_ref[(((i * next_output_height() + y) * next_output_width() + x) * groups() + g) * group_output_channels() + c],
                  double(output[((i * next_output_height() + y) * next_output_width() + x) * output_pixel_stride() + g * group_output_channels() + c]) - double(output_zero_point),
                  0.9)
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
              }
            }
          }
        }
      }
    }
  }

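  // Same resize test as above, for the F32 NHWC convolution.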
Marat Dukhanefc47b82019-11-18 09:25:38 -08001251 void TestSetupNHWCxF32() const {
XNNPACK Teamb455b122019-09-27 18:10:33 -07001252 ASSERT_FALSE(depthwise_layout());
1253
1254 std::random_device random_device;
1255 auto rng = std::mt19937(random_device());
1256 auto f32rng = std::bind(std::uniform_real_distribution<float>(0.1f, 1.0f), rng);
1257
1258 std::vector<float> input(XNN_EXTRA_BYTES / sizeof(float) + std::max(
1259 batch_size() * ((input_height() * input_width() - 1) * input_pixel_stride() + groups() * group_input_channels()),
1260 next_batch_size() * ((next_input_height() * next_input_width() - 1) * input_pixel_stride() + groups() * group_input_channels())));
1261 std::vector<float> kernel(groups() * group_output_channels() * kernel_height() * kernel_width() * group_input_channels());
1262 std::vector<float> bias(groups() * group_output_channels());
1263 std::vector<float> output(std::max(
1264 batch_size() * ((output_height() * output_width() - 1) * output_pixel_stride() + groups() * group_output_channels()),
1265 next_batch_size() * ((next_output_height() * next_output_width() - 1) * output_pixel_stride() + groups() * group_output_channels())));
1266 std::vector<float> output_ref(batch_size() * output_height() * output_width() * groups() * group_output_channels());
1267 std::vector<float> next_output_ref(next_batch_size() * next_output_height() * next_output_width() * groups() * group_output_channels());
1268
1269 for (size_t iteration = 0; iteration < iterations(); iteration++) {
1270 std::generate(input.begin(), input.end(), std::ref(f32rng));
1271 std::generate(kernel.begin(), kernel.end(), std::ref(f32rng));
1272 std::generate(bias.begin(), bias.end(), std::ref(f32rng));
1273 std::fill(output.begin(), output.end(), nanf(""));
1274
1275 // Compute reference results, without clamping.
Marat Dukhanf568f082019-10-30 09:47:07 -07001276 if (has_bias()) {
1277 for (size_t i = 0; i < batch_size(); i++) {
1278 for (size_t oy = 0; oy < output_height(); oy++) {
1279 for (size_t ox = 0; ox < output_width(); ox++) {
1280 for (size_t g = 0; g < groups(); g++) {
1281 for (size_t oc = 0; oc < group_output_channels(); oc++) {
1282 output_ref[(((i * output_height() + oy) * output_width() + ox) * groups() + g) * group_output_channels() + oc] =
1283 bias[g * group_output_channels() + oc];
1284 }
XNNPACK Teamb455b122019-09-27 18:10:33 -07001285 }
1286 }
1287 }
1288 }
Marat Dukhanf568f082019-10-30 09:47:07 -07001289 } else {
1290 std::fill(output_ref.begin(), output_ref.end(), 0.0f);
XNNPACK Teamb455b122019-09-27 18:10:33 -07001291 }
1292 for (size_t i = 0; i < batch_size(); i++) {
1293 for (size_t oy = 0; oy < output_height(); oy++) {
1294 for (size_t ox = 0; ox < output_width(); ox++) {
1295 for (size_t ky = 0; ky < kernel_height(); ky++) {
              const size_t iy = oy * subsampling_height() + ky * dilation_height() - padding_top();
              if (iy < input_height()) {
                for (size_t kx = 0; kx < kernel_width(); kx++) {
                  const size_t ix = ox * subsampling_width() + kx * dilation_width() - padding_left();
                  if (ix < input_width()) {
                    for (size_t g = 0; g < groups(); g++) {
                      for (size_t oc = 0; oc < group_output_channels(); oc++) {
                        for (size_t ic = 0; ic < group_input_channels(); ic++) {
                          output_ref[(((i * output_height() + oy) * output_width() + ox) * groups() + g) * group_output_channels() + oc] +=
                            input[((i * input_height() + iy) * input_width() + ix) * input_pixel_stride() + g * group_input_channels() + ic] *
                            kernel[(((g * group_output_channels() + oc) * kernel_height() + ky) * kernel_width() + kx) * group_input_channels() + ic];
                        }
                      }
                    }
                  }
                }
              }
            }
          }
        }
      }

      // Compute clamping parameters.
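      // qmin()/qmax() in [0, 255] are mapped linearly onto the observed range of
      // the accumulated values, turning the quantization-style clamp settings
      // into float clamping bounds.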
      const float accumulated_min = *std::min_element(output_ref.cbegin(), output_ref.cend());
      const float accumulated_max = *std::max_element(output_ref.cbegin(), output_ref.cend());

      const float output_min = accumulated_min + (accumulated_max - accumulated_min) / 255.0f * float(qmin());
      const float output_max = accumulated_max - (accumulated_max - accumulated_min) / 255.0f * float(255 - qmax());

      // Clamp reference results.
      for (float& value : output_ref) {
        value = std::max(std::min(value, output_max), output_min);
      }

      // Create, setup, and run Convolution operator once.
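      // The operator is created once and set up again below with a different
      // batch size and input shape; that re-setup path is what this test checks.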
      ASSERT_EQ(xnn_status_success, xnn_initialize(nullptr /* allocator */));
      xnn_operator_t convolution_op = nullptr;

      ASSERT_EQ(xnn_status_success,
        xnn_create_convolution2d_nhwc_f32(
          padding_top(), padding_right(), padding_bottom(), padding_left(),
          kernel_height(), kernel_width(),
          subsampling_height(), subsampling_width(),
          dilation_height(), dilation_width(),
          groups(), group_input_channels(), group_output_channels(),
          input_pixel_stride(), output_pixel_stride(),
          kernel.data(), has_bias() ? bias.data() : nullptr,
          output_min, output_max,
          0 /* flags */, &convolution_op));

      // Smart pointer to automatically delete convolution_op.
      std::unique_ptr<xnn_operator, decltype(&xnn_delete_operator)> auto_convolution_op(convolution_op, xnn_delete_operator);

      ASSERT_EQ(xnn_status_success,
        xnn_setup_convolution2d_nhwc_f32(
          convolution_op,
          batch_size(), input_height(), input_width(),
          input.data(), output.data(),
          nullptr /* thread pool */));

      ASSERT_EQ(xnn_status_success,
        xnn_run_operator(convolution_op, nullptr /* thread pool */));

      // Verify results of the first run.
      for (size_t i = 0; i < batch_size(); i++) {
        for (size_t y = 0; y < output_height(); y++) {
          for (size_t x = 0; x < output_width(); x++) {
            for (size_t g = 0; g < groups(); g++) {
              for (size_t c = 0; c < group_output_channels(); c++) {
                ASSERT_GE(output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c], output_min)
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_LE(output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c], output_max)
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_NEAR(
                    output_ref[(((i * output_height() + y) * output_width() + x) * groups() + g) * group_output_channels() + c],
                    output[((i * output_height() + y) * output_width() + x) * output_pixel_stride() + g * group_output_channels() + c],
                    1.0e-4 * std::abs(output_ref[(((i * output_height() + y) * output_width() + x) * groups() + g) * group_output_channels() + c]))
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
              }
            }
          }
        }
      }

      // Re-generate data for the second run.
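      // Only the input is re-randomized: the kernel and bias were packed into
      // the operator at creation time, so they must stay fixed across runs.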
      std::generate(input.begin(), input.end(), std::ref(f32rng));
      std::fill(output.begin(), output.end(), nanf(""));

      // Compute reference results for the second run, including clamping.
      if (has_bias()) {
        for (size_t i = 0; i < next_batch_size(); i++) {
          for (size_t oy = 0; oy < next_output_height(); oy++) {
            for (size_t ox = 0; ox < next_output_width(); ox++) {
              for (size_t g = 0; g < groups(); g++) {
                for (size_t oc = 0; oc < group_output_channels(); oc++) {
                  next_output_ref[(((i * next_output_height() + oy) * next_output_width() + ox) * groups() + g) * group_output_channels() + oc] =
                    bias[g * group_output_channels() + oc];
                }
              }
            }
          }
        }
      } else {
        std::fill(next_output_ref.begin(), next_output_ref.end(), 0.0f);
      }
      for (size_t i = 0; i < next_batch_size(); i++) {
        for (size_t oy = 0; oy < next_output_height(); oy++) {
          for (size_t ox = 0; ox < next_output_width(); ox++) {
            for (size_t ky = 0; ky < kernel_height(); ky++) {
              const size_t iy = oy * subsampling_height() + ky * dilation_height() - padding_top();
              if (iy < next_input_height()) {
                for (size_t kx = 0; kx < kernel_width(); kx++) {
                  const size_t ix = ox * subsampling_width() + kx * dilation_width() - padding_left();
                  if (ix < next_input_width()) {
                    for (size_t g = 0; g < groups(); g++) {
                      for (size_t oc = 0; oc < group_output_channels(); oc++) {
                        for (size_t ic = 0; ic < group_input_channels(); ic++) {
                          next_output_ref[(((i * next_output_height() + oy) * next_output_width() + ox) * groups() + g) * group_output_channels() + oc] +=
                            input[((i * next_input_height() + iy) * next_input_width() + ix) * input_pixel_stride() + g * group_input_channels() + ic] *
                            kernel[(((g * group_output_channels() + oc) * kernel_height() + ky) * kernel_width() + kx) * group_input_channels() + ic];
                        }
                      }
                    }
                  }
                }
              }
            }
          }
        }
      }
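      // Clamp reference results.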
      for (float& value : next_output_ref) {
        value = std::max(std::min(value, output_max), output_min);
      }

      // Set up and run the Convolution operator a second time, and destroy the operator.
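      // (The operator itself is destroyed automatically by auto_convolution_op
      // when it goes out of scope at the end of this iteration.)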
      ASSERT_EQ(xnn_status_success,
        xnn_setup_convolution2d_nhwc_f32(
          convolution_op,
          next_batch_size(), next_input_height(), next_input_width(),
          input.data(), output.data(),
          nullptr /* thread pool */));

      ASSERT_EQ(xnn_status_success,
        xnn_run_operator(convolution_op, nullptr /* thread pool */));

      // Verify results of the second run.
      for (size_t i = 0; i < next_batch_size(); i++) {
        for (size_t y = 0; y < next_output_height(); y++) {
          for (size_t x = 0; x < next_output_width(); x++) {
            for (size_t g = 0; g < groups(); g++) {
              for (size_t c = 0; c < group_output_channels(); c++) {
                ASSERT_GE(output[((i * next_output_height() + y) * next_output_width() + x) * output_pixel_stride() + g * group_output_channels() + c], output_min)
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_LE(output[((i * next_output_height() + y) * next_output_width() + x) * output_pixel_stride() + g * group_output_channels() + c], output_max)
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
                ASSERT_NEAR(
                    next_output_ref[(((i * next_output_height() + y) * next_output_width() + x) * groups() + g) * group_output_channels() + c],
                    output[((i * next_output_height() + y) * next_output_width() + x) * output_pixel_stride() + g * group_output_channels() + c],
                    1.0e-4 * std::abs(next_output_ref[(((i * next_output_height() + y) * next_output_width() + x) * groups() + g) * group_output_channels() + c]))
                  << "(x, y) = (" << x << ", " << y << "), group = " << g << ", channel = " << c;
              }
            }
          }
        }
      }
    }
  }

 private:
  uint32_t padding_top_{0};
  uint32_t padding_right_{0};
  uint32_t padding_bottom_{0};
  uint32_t padding_left_{0};
  bool padding_tf_same_{false};
  size_t input_height_{1};
  size_t input_width_{1};
  uint32_t groups_{1};
  size_t group_input_channels_{1};
  size_t input_pixel_stride_{0};
  size_t input_batch_stride_{0};
  size_t group_output_channels_{1};
  size_t output_pixel_stride_{0};
  size_t output_batch_stride_{0};
  size_t batch_size_{1};
  uint32_t kernel_height_{1};
  uint32_t kernel_width_{1};
  uint32_t dilation_height_{1};
  uint32_t dilation_width_{1};
  uint32_t subsampling_height_{1};
  uint32_t subsampling_width_{1};
  size_t next_input_height_{0};
  size_t next_input_width_{0};
  size_t next_batch_size_{0};
  float sparsity_{0.0f};
  uint8_t qmin_{0};
  uint8_t qmax_{255};
  bool depthwise_layout_{false};
  bool force_nhwc_input_{false};
  bool has_bias_{true};
  size_t iterations_{1};
};
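
// A minimal usage sketch (hypothetical; real tests live in the accompanying
// test .cc files). It assumes the fluent setters defined earlier in this
// header -- batch_size(), next_batch_size(), input_size(), kernel_size(),
// group_input_channels(), group_output_channels() -- and exercises the
// create-once/setup-twice path verified by TestSetupNHWCxF32() above:
//
//   TEST(CONVOLUTION_NHWC_F32, setup_changing_batch) {
//     ConvolutionOperatorTester()
//       .batch_size(2)
//       .next_batch_size(4)
//       .input_size(8, 8)
//       .kernel_size(3, 3)
//       .group_input_channels(15)
//       .group_output_channels(19)
//       .TestSetupNHWCxF32();
//   }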