You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

146 lines
3.9 KiB

// Copyright 2016 The Gemmlowp Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#ifndef GEMMLOWP_META_BASE_H_
#define GEMMLOWP_META_BASE_H_
#include <cassert>
#include <cstdint>
#include "../internal/common.h"
namespace gemmlowp {
namespace meta {
// Rounds `value` up to the nearest multiple of the compile-time constant
// `align` and returns the result. A `value` that is already a multiple of
// `align` is returned unchanged.
//
// `align` must be strictly positive: zero would divide by zero and a negative
// alignment has no sensible meaning, so both are rejected at compile time.
//
// NOTE: the formula relies on truncating integer division, so it only rounds
// up correctly for non-negative `value`, and `value + align - 1` must not
// overflow `int`.
template <int align>
inline int AlignTo(int value) {
  static_assert(align > 0, "AlignTo: alignment must be a positive integer");
  return ((value + align - 1) / align) * align;
}
// Run-time counterpart of the templated AlignTo: rounds `value` up to the
// nearest multiple of `align` and returns the result. A `value` that is
// already a multiple of `align` is returned unchanged.
//
// `align` must be strictly positive. Passing zero would divide by zero
// (undefined behaviour), so the precondition is checked in debug builds.
//
// NOTE: the formula relies on truncating integer division, so it only rounds
// up correctly for non-negative `value`, and `value + align - 1` must not
// overflow `int`.
inline int AlignTo(int align, int value) {
  assert(align > 0);
  return ((value + align - 1) / align) * align;
}
// Plain aggregate that bundles one `Kernel_` value with one `OutputStream_`
// value. Both template arguments are re-exported as the member types
// `Kernel` and `OutputStream`.
template <typename Kernel_, typename OutputStream_>
struct FusedKernelParams {
  // Re-exported template arguments.
  using Kernel = Kernel_;
  using OutputStream = OutputStream_;

  // Kernel-specific parameters.
  Kernel kernel;
  // Output-stream-specific parameters.
  OutputStream output_stream;
};
// Aggregate describing one GEMM invocation. All six template arguments are
// re-exported as member types, and `FusedKernel` names the
// FusedKernelParams instantiation built from `Kernel` and `OutputStream`.
template <typename InType_, typename OutType_, typename LeftStream_,
          typename RightStream_, typename Kernel_, typename OutputStream_>
struct GemmParams {
  // Re-exported template arguments.
  using InType = InType_;
  using OutType = OutType_;
  using LeftStream = LeftStream_;
  using RightStream = RightStream_;
  using Kernel = Kernel_;
  using OutputStream = OutputStream_;
  using FusedKernel = FusedKernelParams<Kernel, OutputStream>;

  // Common parameters.
  // NOTE(review): m, n and k are presumably the matrix dimensions of the
  // product -- confirm against the callers.
  int m;
  int n;
  int k;
  const InType* lhs;      // Read-only left-hand-side input.
  const InType* rhs;      // Read-only right-hand-side input.
  OutType* result;        // Writable output.
  std::uint8_t* scratch;  // Writable byte buffer.

  // Specialized parameters.
  LeftStream left_stream;
  RightStream right_stream;
  FusedKernel fused_kernel;
};
// Primary template of a stream, parameterized on the element type, three
// integer constants (`lanes_count`, `pack_size`, `leftovers`) and a
// `StreamParams` type. Only the static interface is declared here; this
// template itself supplies no definitions.
// NOTE(review): presumably the behaviour is provided by specializations
// defined elsewhere -- confirm.
template <typename InType, int lanes_count, int pack_size, int leftovers,
typename StreamParams>
class Stream {
public:
// Takes a read-only input pointer `in`, the stream parameters, and a
// writable output pointer `out`.
static void Pack(const InType* in, const StreamParams& params, InType* out);
// The four queries below each return an int derived from `params`.
// NOTE(review): units (elements vs. bytes) are not visible here -- confirm.
static int UnpackedAdvance(const StreamParams& params);
static int PackedAdvance(const StreamParams& params);
static int UnpackedStride(const StreamParams& params);
static int PackedStride(const StreamParams& params);
};
// Primary template of stream helper routines, parameterized on the element
// type and a stream parameter type. Only the static interface is declared
// here; this template itself supplies no definitions.
// NOTE(review): presumably specialized per stream type elsewhere -- confirm.
template <typename InType, typename StreamType>
class StreamUtil {
public:
// Returns a read-only pointer computed from `source`, the stream parameters
// and the two integer offsets.
static const InType* Offset(const StreamType& params, const InType* source,
int offset_stride, int offset_advance);
// Returns an int computed from the stream parameters and `lanes`.
// NOTE(review): presumably a scratch-space size requirement -- confirm.
static int Scratch(const StreamType& params, int lanes);
};
// Primary template of a multiplication kernel, parameterized on the input and
// output element types, the kernel and output-stream parameter types, and
// three integer constants (`kernel_m`, `kernel_n`, `pack_size`). Only the
// static interface is declared here; this template itself supplies no
// definition.
// NOTE(review): presumably specialized per kernel shape elsewhere -- confirm.
template <typename InType, typename OutType, typename Kernel,
typename OutputStream, int kernel_m, int kernel_n, int pack_size>
class MulKernel {
public:
// Takes read-only `lhs` and `rhs` inputs, the fused kernel/output-stream
// parameters, and a writable `result` pointer.
static void Multiply(const InType* lhs, const InType* rhs,
const FusedKernelParams<Kernel, OutputStream>& params,
OutType* result);
};
// Aggregate describing one 1-D transform invocation: a read-only input
// pointer, a writable output pointer, a writable byte buffer and a
// `Kernel_` value. The three template arguments are re-exported as the
// member types `InType`, `OutType` and `Kernel`.
template <typename InType_, typename OutType_, typename Kernel_>
struct Transform1DParams {
  // Re-exported template arguments.
  using InType = InType_;
  using OutType = OutType_;
  using Kernel = Kernel_;

  const InType* input;    // Read-only source data.
  OutType* output;        // Writable destination.
  std::uint8_t* scratch;  // Writable byte buffer.
  Kernel kernel;          // Kernel-specific parameters.
};
// Primary template of a 1-D transform kernel, parameterized on the input and
// output element types, a kernel parameter type and two integer constants
// (`kernel_size`, `leftovers`). Only the static interface is declared here;
// this template itself supplies no definition.
// NOTE(review): presumably specialized per kernel type elsewhere -- confirm.
template <typename InType, typename OutType, typename Kernel, int kernel_size,
int leftovers>
class Transform1DKernel {
public:
// Takes a read-only `input` pointer, the kernel parameters, and a writable
// `output` pointer.
static void Transform(const InType* input, const Kernel& params,
OutType* output);
};
// Primary template of 1-D transform helper routines, parameterized on the
// input and output element types and a transform parameter type. Only the
// static interface is declared here; this template itself supplies no
// definitions.
// NOTE(review): presumably specialized per transform type elsewhere --
// confirm.
template <typename InType, typename OutType, typename Transform>
class Transform1DUtil {
public:
// Returns an int computed from the transform parameters.
// NOTE(review): the unit of the cost estimate is not visible here -- confirm.
static int EstimateComputeCost(const Transform& params);
// Returns a read-only pointer computed from `input`, the transform
// parameters and `offset`.
static const InType* OffsetInput(const Transform& params, const InType* input,
int offset);
// Returns a writable pointer computed from `output`, the transform
// parameters and `offset`.
static OutType* OffsetOutput(const Transform& params, OutType* output,
int offset);
};
} // namespace meta
} // namespace gemmlowp
#endif // GEMMLOWP_META_BASE_H_