brcmsmac/phy/phy_qmath.c

*b4c3e9b5SBjoern A. Zeeb// SPDX-License-Identifier: ISC
*b4c3e9b5SBjoern A. Zeeb/*
*b4c3e9b5SBjoern A. Zeeb * Copyright (c) 2010 Broadcom Corporation
*b4c3e9b5SBjoern A. Zeeb */
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb#include "phy_qmath.h"
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb/*
*b4c3e9b5SBjoern A. Zeeb * Description: This function make 16 bit unsigned multiplication.
*b4c3e9b5SBjoern A. Zeeb * To fit the output into 16 bits the 32 bit multiplication result is right
*b4c3e9b5SBjoern A. Zeeb * shifted by 16 bits.
*b4c3e9b5SBjoern A. Zeeb */
*b4c3e9b5SBjoern A. Zeebu16 qm_mulu16(u16 op1, u16 op2)
*b4c3e9b5SBjoern A. Zeeb{
*b4c3e9b5SBjoern A. Zeeb	return (u16) (((u32) op1 * (u32) op2) >> 16);
*b4c3e9b5SBjoern A. Zeeb}
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb/*
*b4c3e9b5SBjoern A. Zeeb * Description: This function make 16 bit multiplication and return the result
*b4c3e9b5SBjoern A. Zeeb * in 16 bits. To fit the multiplication result into 16 bits the multiplication
*b4c3e9b5SBjoern A. Zeeb * result is right shifted by 15 bits. Right shifting 15 bits instead of 16 bits
*b4c3e9b5SBjoern A. Zeeb * is done to remove the extra sign bit formed due to the multiplication.
*b4c3e9b5SBjoern A. Zeeb * When both the 16bit inputs are 0x8000 then the output is saturated to
*b4c3e9b5SBjoern A. Zeeb * 0x7fffffff.
*b4c3e9b5SBjoern A. Zeeb */
*b4c3e9b5SBjoern A. Zeebs16 qm_muls16(s16 op1, s16 op2)
*b4c3e9b5SBjoern A. Zeeb{
*b4c3e9b5SBjoern A. Zeeb	s32 result;
*b4c3e9b5SBjoern A. Zeeb	if (op1 == (s16) 0x8000 && op2 == (s16) 0x8000)
*b4c3e9b5SBjoern A. Zeeb		result = 0x7fffffff;
*b4c3e9b5SBjoern A. Zeeb	else
*b4c3e9b5SBjoern A. Zeeb		result = ((s32) (op1) * (s32) (op2));
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	return (s16) (result >> 15);
*b4c3e9b5SBjoern A. Zeeb}
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb/*
*b4c3e9b5SBjoern A. Zeeb * Description: This function add two 32 bit numbers and return the 32bit
*b4c3e9b5SBjoern A. Zeeb * result. If the result overflow 32 bits, the output will be saturated to
*b4c3e9b5SBjoern A. Zeeb * 32bits.
*b4c3e9b5SBjoern A. Zeeb */
*b4c3e9b5SBjoern A. Zeebs32 qm_add32(s32 op1, s32 op2)
*b4c3e9b5SBjoern A. Zeeb{
*b4c3e9b5SBjoern A. Zeeb	s32 result;
*b4c3e9b5SBjoern A. Zeeb	result = op1 + op2;
*b4c3e9b5SBjoern A. Zeeb	if (op1 < 0 && op2 < 0 && result > 0)
*b4c3e9b5SBjoern A. Zeeb		result = 0x80000000;
*b4c3e9b5SBjoern A. Zeeb	else if (op1 > 0 && op2 > 0 && result < 0)
*b4c3e9b5SBjoern A. Zeeb		result = 0x7fffffff;
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	return result;
*b4c3e9b5SBjoern A. Zeeb}
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb/*
*b4c3e9b5SBjoern A. Zeeb * Description: This function add two 16 bit numbers and return the 16bit
*b4c3e9b5SBjoern A. Zeeb * result. If the result overflow 16 bits, the output will be saturated to
*b4c3e9b5SBjoern A. Zeeb * 16bits.
*b4c3e9b5SBjoern A. Zeeb */
*b4c3e9b5SBjoern A. Zeebs16 qm_add16(s16 op1, s16 op2)
*b4c3e9b5SBjoern A. Zeeb{
*b4c3e9b5SBjoern A. Zeeb	s16 result;
*b4c3e9b5SBjoern A. Zeeb	s32 temp = (s32) op1 + (s32) op2;
*b4c3e9b5SBjoern A. Zeeb	if (temp > (s32) 0x7fff)
*b4c3e9b5SBjoern A. Zeeb		result = (s16) 0x7fff;
*b4c3e9b5SBjoern A. Zeeb	else if (temp < (s32) 0xffff8000)
*b4c3e9b5SBjoern A. Zeeb		result = (s16) 0xffff8000;
*b4c3e9b5SBjoern A. Zeeb	else
*b4c3e9b5SBjoern A. Zeeb		result = (s16) temp;
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	return result;
*b4c3e9b5SBjoern A. Zeeb}
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb/*
*b4c3e9b5SBjoern A. Zeeb * Description: This function make 16 bit subtraction and return the 16bit
*b4c3e9b5SBjoern A. Zeeb * result. If the result overflow 16 bits, the output will be saturated to
*b4c3e9b5SBjoern A. Zeeb * 16bits.
*b4c3e9b5SBjoern A. Zeeb */
*b4c3e9b5SBjoern A. Zeebs16 qm_sub16(s16 op1, s16 op2)
*b4c3e9b5SBjoern A. Zeeb{
*b4c3e9b5SBjoern A. Zeeb	s16 result;
*b4c3e9b5SBjoern A. Zeeb	s32 temp = (s32) op1 - (s32) op2;
*b4c3e9b5SBjoern A. Zeeb	if (temp > (s32) 0x7fff)
*b4c3e9b5SBjoern A. Zeeb		result = (s16) 0x7fff;
*b4c3e9b5SBjoern A. Zeeb	else if (temp < (s32) 0xffff8000)
*b4c3e9b5SBjoern A. Zeeb		result = (s16) 0xffff8000;
*b4c3e9b5SBjoern A. Zeeb	else
*b4c3e9b5SBjoern A. Zeeb		result = (s16) temp;
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	return result;
*b4c3e9b5SBjoern A. Zeeb}
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb/*
*b4c3e9b5SBjoern A. Zeeb * Description: This function make a 32 bit saturated left shift when the
*b4c3e9b5SBjoern A. Zeeb * specified shift is +ve. This function will make a 32 bit right shift when
*b4c3e9b5SBjoern A. Zeeb * the specified shift is -ve. This function return the result after shifting
*b4c3e9b5SBjoern A. Zeeb * operation.
*b4c3e9b5SBjoern A. Zeeb */
*b4c3e9b5SBjoern A. Zeebs32 qm_shl32(s32 op, int shift)
*b4c3e9b5SBjoern A. Zeeb{
*b4c3e9b5SBjoern A. Zeeb	int i;
*b4c3e9b5SBjoern A. Zeeb	s32 result;
*b4c3e9b5SBjoern A. Zeeb	result = op;
*b4c3e9b5SBjoern A. Zeeb	if (shift > 31)
*b4c3e9b5SBjoern A. Zeeb		shift = 31;
*b4c3e9b5SBjoern A. Zeeb	else if (shift < -31)
*b4c3e9b5SBjoern A. Zeeb		shift = -31;
*b4c3e9b5SBjoern A. Zeeb	if (shift >= 0) {
*b4c3e9b5SBjoern A. Zeeb		for (i = 0; i < shift; i++)
*b4c3e9b5SBjoern A. Zeeb			result = qm_add32(result, result);
*b4c3e9b5SBjoern A. Zeeb	} else {
*b4c3e9b5SBjoern A. Zeeb		result = result >> (-shift);
*b4c3e9b5SBjoern A. Zeeb	}
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	return result;
*b4c3e9b5SBjoern A. Zeeb}
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb/*
*b4c3e9b5SBjoern A. Zeeb * Description: This function make a 16 bit saturated left shift when the
*b4c3e9b5SBjoern A. Zeeb * specified shift is +ve. This function will make a 16 bit right shift when
*b4c3e9b5SBjoern A. Zeeb * the specified shift is -ve. This function return the result after shifting
*b4c3e9b5SBjoern A. Zeeb * operation.
*b4c3e9b5SBjoern A. Zeeb */
*b4c3e9b5SBjoern A. Zeebs16 qm_shl16(s16 op, int shift)
*b4c3e9b5SBjoern A. Zeeb{
*b4c3e9b5SBjoern A. Zeeb	int i;
*b4c3e9b5SBjoern A. Zeeb	s16 result;
*b4c3e9b5SBjoern A. Zeeb	result = op;
*b4c3e9b5SBjoern A. Zeeb	if (shift > 15)
*b4c3e9b5SBjoern A. Zeeb		shift = 15;
*b4c3e9b5SBjoern A. Zeeb	else if (shift < -15)
*b4c3e9b5SBjoern A. Zeeb		shift = -15;
*b4c3e9b5SBjoern A. Zeeb	if (shift > 0) {
*b4c3e9b5SBjoern A. Zeeb		for (i = 0; i < shift; i++)
*b4c3e9b5SBjoern A. Zeeb			result = qm_add16(result, result);
*b4c3e9b5SBjoern A. Zeeb	} else {
*b4c3e9b5SBjoern A. Zeeb		result = result >> (-shift);
*b4c3e9b5SBjoern A. Zeeb	}
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	return result;
*b4c3e9b5SBjoern A. Zeeb}
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb/*
*b4c3e9b5SBjoern A. Zeeb * Description: This function make a 16 bit right shift when shift is +ve.
*b4c3e9b5SBjoern A. Zeeb * This function make a 16 bit saturated left shift when shift is -ve. This
*b4c3e9b5SBjoern A. Zeeb * function return the result of the shift operation.
*b4c3e9b5SBjoern A. Zeeb */
*b4c3e9b5SBjoern A. Zeebs16 qm_shr16(s16 op, int shift)
*b4c3e9b5SBjoern A. Zeeb{
*b4c3e9b5SBjoern A. Zeeb	return qm_shl16(op, -shift);
*b4c3e9b5SBjoern A. Zeeb}
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb/*
*b4c3e9b5SBjoern A. Zeeb * Description: This function return the number of redundant sign bits in a
*b4c3e9b5SBjoern A. Zeeb * 32 bit number. Example: qm_norm32(0x00000080) = 23
*b4c3e9b5SBjoern A. Zeeb */
*b4c3e9b5SBjoern A. Zeebs16 qm_norm32(s32 op)
*b4c3e9b5SBjoern A. Zeeb{
*b4c3e9b5SBjoern A. Zeeb	u16 u16extraSignBits;
*b4c3e9b5SBjoern A. Zeeb	if (op == 0) {
*b4c3e9b5SBjoern A. Zeeb		return 31;
*b4c3e9b5SBjoern A. Zeeb	} else {
*b4c3e9b5SBjoern A. Zeeb		u16extraSignBits = 0;
*b4c3e9b5SBjoern A. Zeeb		while ((op >> 31) == (op >> 30)) {
*b4c3e9b5SBjoern A. Zeeb			u16extraSignBits++;
*b4c3e9b5SBjoern A. Zeeb			op = op << 1;
*b4c3e9b5SBjoern A. Zeeb		}
*b4c3e9b5SBjoern A. Zeeb	}
*b4c3e9b5SBjoern A. Zeeb	return u16extraSignBits;
*b4c3e9b5SBjoern A. Zeeb}
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb/* This table is log2(1+(i/32)) where i=[0:1:32], in q.15 format */
*b4c3e9b5SBjoern A. Zeebstatic const s16 log_table[] = {
*b4c3e9b5SBjoern A. Zeeb	0,
*b4c3e9b5SBjoern A. Zeeb	1455,
*b4c3e9b5SBjoern A. Zeeb	2866,
*b4c3e9b5SBjoern A. Zeeb	4236,
*b4c3e9b5SBjoern A. Zeeb	5568,
*b4c3e9b5SBjoern A. Zeeb	6863,
*b4c3e9b5SBjoern A. Zeeb	8124,
*b4c3e9b5SBjoern A. Zeeb	9352,
*b4c3e9b5SBjoern A. Zeeb	10549,
*b4c3e9b5SBjoern A. Zeeb	11716,
*b4c3e9b5SBjoern A. Zeeb	12855,
*b4c3e9b5SBjoern A. Zeeb	13968,
*b4c3e9b5SBjoern A. Zeeb	15055,
*b4c3e9b5SBjoern A. Zeeb	16117,
*b4c3e9b5SBjoern A. Zeeb	17156,
*b4c3e9b5SBjoern A. Zeeb	18173,
*b4c3e9b5SBjoern A. Zeeb	19168,
*b4c3e9b5SBjoern A. Zeeb	20143,
*b4c3e9b5SBjoern A. Zeeb	21098,
*b4c3e9b5SBjoern A. Zeeb	22034,
*b4c3e9b5SBjoern A. Zeeb	22952,
*b4c3e9b5SBjoern A. Zeeb	23852,
*b4c3e9b5SBjoern A. Zeeb	24736,
*b4c3e9b5SBjoern A. Zeeb	25604,
*b4c3e9b5SBjoern A. Zeeb	26455,
*b4c3e9b5SBjoern A. Zeeb	27292,
*b4c3e9b5SBjoern A. Zeeb	28114,
*b4c3e9b5SBjoern A. Zeeb	28922,
*b4c3e9b5SBjoern A. Zeeb	29717,
*b4c3e9b5SBjoern A. Zeeb	30498,
*b4c3e9b5SBjoern A. Zeeb	31267,
*b4c3e9b5SBjoern A. Zeeb	32024,
*b4c3e9b5SBjoern A. Zeeb	32767
*b4c3e9b5SBjoern A. Zeeb};
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb#define LOG_TABLE_SIZE 32       /* log_table size */
*b4c3e9b5SBjoern A. Zeeb#define LOG2_LOG_TABLE_SIZE 5   /* log2(log_table size) */
*b4c3e9b5SBjoern A. Zeeb#define Q_LOG_TABLE 15          /* qformat of log_table */
*b4c3e9b5SBjoern A. Zeeb#define LOG10_2         19728   /* log10(2) in q.16 */
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb/*
*b4c3e9b5SBjoern A. Zeeb * Description:
*b4c3e9b5SBjoern A. Zeeb * This routine takes the input number N and its q format qN and compute
*b4c3e9b5SBjoern A. Zeeb * the log10(N). This routine first normalizes the input no N.	Then N is in
*b4c3e9b5SBjoern A. Zeeb * mag*(2^x) format. mag is any number in the range 2^30-(2^31 - 1).
*b4c3e9b5SBjoern A. Zeeb * Then log2(mag * 2^x) = log2(mag) + x is computed. From that
*b4c3e9b5SBjoern A. Zeeb * log10(mag * 2^x) = log2(mag * 2^x) * log10(2) is computed.
*b4c3e9b5SBjoern A. Zeeb * This routine looks the log2 value in the table considering
*b4c3e9b5SBjoern A. Zeeb * LOG2_LOG_TABLE_SIZE+1 MSBs. As the MSB is always 1, only next
*b4c3e9b5SBjoern A. Zeeb * LOG2_OF_LOG_TABLE_SIZE MSBs are used for table lookup. Next 16 MSBs are used
*b4c3e9b5SBjoern A. Zeeb * for interpolation.
*b4c3e9b5SBjoern A. Zeeb * Inputs:
*b4c3e9b5SBjoern A. Zeeb * N - number to which log10 has to be found.
*b4c3e9b5SBjoern A. Zeeb * qN - q format of N
*b4c3e9b5SBjoern A. Zeeb * log10N - address where log10(N) will be written.
*b4c3e9b5SBjoern A. Zeeb * qLog10N - address where log10N qformat will be written.
*b4c3e9b5SBjoern A. Zeeb * Note/Problem:
*b4c3e9b5SBjoern A. Zeeb * For accurate results input should be in normalized or near normalized form.
*b4c3e9b5SBjoern A. Zeeb */
*b4c3e9b5SBjoern A. Zeebvoid qm_log10(s32 N, s16 qN, s16 *log10N, s16 *qLog10N)
*b4c3e9b5SBjoern A. Zeeb{
*b4c3e9b5SBjoern A. Zeeb	s16 s16norm, s16tableIndex, s16errorApproximation;
*b4c3e9b5SBjoern A. Zeeb	u16 u16offset;
*b4c3e9b5SBjoern A. Zeeb	s32 s32log;
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* normalize the N. */
*b4c3e9b5SBjoern A. Zeeb	s16norm = qm_norm32(N);
*b4c3e9b5SBjoern A. Zeeb	N = N << s16norm;
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* The qformat of N after normalization.
*b4c3e9b5SBjoern A. Zeeb	 * -30 is added to treat the no as between 1.0 to 2.0
*b4c3e9b5SBjoern A. Zeeb	 * i.e. after adding the -30 to the qformat the decimal point will be
*b4c3e9b5SBjoern A. Zeeb	 * just rigtht of the MSB. (i.e. after sign bit and 1st MSB). i.e.
*b4c3e9b5SBjoern A. Zeeb	 * at the right side of 30th bit.
*b4c3e9b5SBjoern A. Zeeb	 */
*b4c3e9b5SBjoern A. Zeeb	qN = qN + s16norm - 30;
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* take the table index as the LOG2_OF_LOG_TABLE_SIZE bits right of the
*b4c3e9b5SBjoern A. Zeeb	 * MSB */
*b4c3e9b5SBjoern A. Zeeb	s16tableIndex = (s16) (N >> (32 - (2 + LOG2_LOG_TABLE_SIZE)));
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* remove the MSB. the MSB is always 1 after normalization. */
*b4c3e9b5SBjoern A. Zeeb	s16tableIndex =
*b4c3e9b5SBjoern A. Zeeb		s16tableIndex & (s16) ((1 << LOG2_LOG_TABLE_SIZE) - 1);
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* remove the (1+LOG2_OF_LOG_TABLE_SIZE) MSBs in the N. */
*b4c3e9b5SBjoern A. Zeeb	N = N & ((1 << (32 - (2 + LOG2_LOG_TABLE_SIZE))) - 1);
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* take the offset as the 16 MSBS after table index.
*b4c3e9b5SBjoern A. Zeeb	 */
*b4c3e9b5SBjoern A. Zeeb	u16offset = (u16) (N >> (32 - (2 + LOG2_LOG_TABLE_SIZE + 16)));
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* look the log value in the table. */
*b4c3e9b5SBjoern A. Zeeb	s32log = log_table[s16tableIndex];      /* q.15 format */
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* interpolate using the offset. q.15 format. */
*b4c3e9b5SBjoern A. Zeeb	s16errorApproximation = (s16) qm_mulu16(u16offset,
*b4c3e9b5SBjoern A. Zeeb				(u16) (log_table[s16tableIndex + 1] -
*b4c3e9b5SBjoern A. Zeeb				       log_table[s16tableIndex]));
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	 /* q.15 format */
*b4c3e9b5SBjoern A. Zeeb	s32log = qm_add16((s16) s32log, s16errorApproximation);
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* adjust for the qformat of the N as
*b4c3e9b5SBjoern A. Zeeb	 * log2(mag * 2^x) = log2(mag) + x
*b4c3e9b5SBjoern A. Zeeb	 */
*b4c3e9b5SBjoern A. Zeeb	s32log = qm_add32(s32log, ((s32) -qN) << 15);   /* q.15 format */
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* normalize the result. */
*b4c3e9b5SBjoern A. Zeeb	s16norm = qm_norm32(s32log);
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* bring all the important bits into lower 16 bits */
*b4c3e9b5SBjoern A. Zeeb	/* q.15+s16norm-16 format */
*b4c3e9b5SBjoern A. Zeeb	s32log = qm_shl32(s32log, s16norm - 16);
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* compute the log10(N) by multiplying log2(N) with log10(2).
*b4c3e9b5SBjoern A. Zeeb	 * as log10(mag * 2^x) = log2(mag * 2^x) * log10(2)
*b4c3e9b5SBjoern A. Zeeb	 * log10N in q.15+s16norm-16+1 (LOG10_2 is in q.16)
*b4c3e9b5SBjoern A. Zeeb	 */
*b4c3e9b5SBjoern A. Zeeb	*log10N = qm_muls16((s16) s32log, (s16) LOG10_2);
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	/* write the q format of the result. */
*b4c3e9b5SBjoern A. Zeeb	*qLog10N = 15 + s16norm - 16 + 1;
*b4c3e9b5SBjoern A. Zeeb
*b4c3e9b5SBjoern A. Zeeb	return;
*b4c3e9b5SBjoern A. Zeeb}