/*
 * Copyright (c) 2012-2020 MIRACL UK Ltd.
 *
 * This file is part of MIRACL Core
 * (see https://github.com/miracl/core).
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

/* CORE Fp^16 functions */

/* FP16 elements are of the form a+ib, where i is sqrt(sqrt(sqrt(-1+sqrt(-1)))) */

#include "fp16_YYY.h"

using namespace XXX;

/* test x==0 ? */
int YYY::FP16_iszilch(FP16 *x)
{
    if (FP8_iszilch(&(x->a)) && FP8_iszilch(&(x->b))) return 1;
    return 0;
}

/* test x==1 ? */
int YYY::FP16_isunity(FP16 *x)
{
    if (FP8_isunity(&(x->a)) && FP8_iszilch(&(x->b))) return 1;
    return 0;
}

/* test: is w real? That is, in a+ib, test whether b is zero */
int YYY::FP16_isreal(FP16 *w)
{
    return FP8_iszilch(&(w->b));
}

/* return 1 if x==y, else 0 */
int YYY::FP16_equals(FP16 *x, FP16 *y)
{
    if (FP8_equals(&(x->a), &(y->a)) && FP8_equals(&(x->b), &(y->b)))
        return 1;
    return 0;
}

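/* Serialisation layout (as implemented below): the b part is written at offset 0
   and the a part at offset 8*MODBYTES_XXX, so a full FP16 occupies 16*MODBYTES_XXX bytes */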
void YYY::FP16_toBytes(char *b, FP16 *x)
{
    FP8_toBytes(b, &(x->b));
    FP8_toBytes(&b[8*MODBYTES_XXX], &(x->a));
}

void YYY::FP16_fromBytes(FP16 *x, char *b)
{
    FP8_fromBytes(&(x->b), b);
    FP8_fromBytes(&(x->a), &b[8*MODBYTES_XXX]);
}

/* set FP16 from two FP8s */
void YYY::FP16_from_FP8s(FP16 *w, FP8 *x, FP8 *y)
{
    FP8_copy(&(w->a), x);
    FP8_copy(&(w->b), y);
}

/* set FP16 from FP8 */
void YYY::FP16_from_FP8(FP16 *w, FP8 *x)
{
    FP8_copy(&(w->a), x);
    FP8_zero(&(w->b));
}

/* set high part of FP16 from FP8 */
void YYY::FP16_from_FP8H(FP16 *w, FP8 *x)
{
    FP8_copy(&(w->b), x);
    FP8_zero(&(w->a));
}

/* FP16 copy w=x */
void YYY::FP16_copy(FP16 *w, FP16 *x)
{
    if (w == x) return;
    FP8_copy(&(w->a), &(x->a));
    FP8_copy(&(w->b), &(x->b));
}

/* FP16 w=0 */
void YYY::FP16_zero(FP16 *w)
{
    FP8_zero(&(w->a));
    FP8_zero(&(w->b));
}

/* FP16 w=1 */
void YYY::FP16_one(FP16 *w)
{
    FP8_one(&(w->a));
    FP8_zero(&(w->b));
}

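/* Negation below uses one shared FP8 negation: with m = -(a+b),
   the result is (-a, -b) = (m+b, m+a) */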
/* Set w=-x */
void YYY::FP16_neg(FP16 *w, FP16 *x)
{
    /* Just one field neg */
    FP8 m, t;
    FP16_norm(x);
    FP8_add(&m, &(x->a), &(x->b));
    FP8_norm(&m);
    FP8_neg(&m, &m);
    FP8_add(&t, &m, &(x->b));
    FP8_add(&(w->b), &m, &(x->a));
    FP8_copy(&(w->a), &t);
    FP16_norm(w);
}

/* Set w=conj(x) */
void YYY::FP16_conj(FP16 *w, FP16 *x)
{
    FP8_copy(&(w->a), &(x->a));
    FP8_neg(&(w->b), &(x->b));
    FP16_norm(w);
}

/* Set w=-conj(x) */
void YYY::FP16_nconj(FP16 *w, FP16 *x)
{
    FP8_copy(&(w->b), &(x->b));
    FP8_neg(&(w->a), &(x->a));
    FP16_norm(w);
}

/* Set w=x+y */
void YYY::FP16_add(FP16 *w, FP16 *x, FP16 *y)
{
    FP8_add(&(w->a), &(x->a), &(y->a));
    FP8_add(&(w->b), &(x->b), &(y->b));
}

/* Set w=x-y */
/* Input y MUST be normed */
void YYY::FP16_sub(FP16 *w, FP16 *x, FP16 *y)
{
    FP16 my;

    FP16_neg(&my, y);
    FP16_add(w, x, &my);
}

/* reduce all components of w mod Modulus */
void YYY::FP16_reduce(FP16 *w)
{
    FP8_reduce(&(w->a));
    FP8_reduce(&(w->b));
}

/* normalise all components of w */
void YYY::FP16_norm(FP16 *w)
{
    FP8_norm(&(w->a));
    FP8_norm(&(w->b));
}

/* Set w=s*x, where s is FP8 */
void YYY::FP16_pmul(FP16 *w, FP16 *x, FP8 *s)
{
    FP8_mul(&(w->a), &(x->a), s);
    FP8_mul(&(w->b), &(x->b), s);
}

/* Set w=s*x, where s is FP2 */
void YYY::FP16_qmul(FP16 *w, FP16 *x, FP2 *s)
{
    FP8_qmul(&(w->a), &(x->a), s);
    FP8_qmul(&(w->b), &(x->b), s);
}

/* Set w=s*x, where s is FP */
void YYY::FP16_tmul(FP16 *w, FP16 *x, FP *s)
{
    FP8_tmul(&(w->a), &(x->a), s);
    FP8_tmul(&(w->b), &(x->b), s);
}

/* Set w=s*x, where s is int */
void YYY::FP16_imul(FP16 *w, FP16 *x, int s)
{
    FP8_imul(&(w->a), &(x->a), s);
    FP8_imul(&(w->b), &(x->b), s);
}

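/* Squaring below uses the complex method: with t3=a.b, the a-part of (a+ib)^2 is
   (a+b)(a+i^2.b) - (1+i^2)ab and the b-part is 2ab, so only two FP8
   multiplications are needed */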
/* Set w=x^2 */
/* Input MUST be normed */
void YYY::FP16_sqr(FP16 *w, FP16 *x)
{
    FP8 t1, t2, t3;

    FP8_mul(&t3, &(x->a), &(x->b)); /* norms x */
    FP8_copy(&t2, &(x->b));
    FP8_add(&t1, &(x->a), &(x->b));
    FP8_times_i(&t2);

    FP8_add(&t2, &(x->a), &t2);

    FP8_norm(&t1);  // 2
    FP8_norm(&t2);  // 2

    FP8_mul(&(w->a), &t1, &t2);

    FP8_copy(&t2, &t3);
    FP8_times_i(&t2);

    FP8_add(&t2, &t2, &t3);

    FP8_norm(&t2);  // 2
    FP8_neg(&t2, &t2);
    FP8_add(&(w->a), &(w->a), &t2); /* a=(a+b)(a+i^2.b)-i^2.ab-ab = a*a+ib*ib */
    FP8_add(&(w->b), &t3, &t3);     /* b=2ab */

    FP16_norm(w);
}

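/* Multiplication below is Karatsuba-style: t1=xa.ya, t2=xb.yb, t4=(xa+xb)(ya+yb);
   then the b-part is t4-t1-t2 and the a-part is t1 + i^2.t2, so three FP8
   multiplications are used instead of four */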
/* Set w=x*y */
/* Inputs MUST be normed */
void YYY::FP16_mul(FP16 *w, FP16 *x, FP16 *y)
{
    FP8 t1, t2, t3, t4;

    FP8_mul(&t1, &(x->a), &(y->a));
    FP8_mul(&t2, &(x->b), &(y->b));

    FP8_add(&t3, &(y->b), &(y->a));
    FP8_add(&t4, &(x->b), &(x->a));

    FP8_norm(&t4);  // 2
    FP8_norm(&t3);  // 2

    FP8_mul(&t4, &t4, &t3);     /* (xa+xb)(ya+yb) */
    FP8_neg(&t3, &t1);          // 1
    FP8_add(&t4, &t4, &t3);     // t4E=3
    FP8_norm(&t4);

    FP8_neg(&t3, &t2);          // 1
    FP8_add(&(w->b), &t4, &t3); // wbE=3

    FP8_times_i(&t2);
    FP8_add(&(w->a), &t2, &t1);

    FP16_norm(w);
}

/* output FP16 in format [a,b] */
void YYY::FP16_output(FP16 *w)
{
    printf("[");
    FP8_output(&(w->a));
    printf(",");
    FP8_output(&(w->b));
    printf("]");
}

void YYY::FP16_rawoutput(FP16 *w)
{
    printf("[");
    FP8_rawoutput(&(w->a));
    printf(",");
    FP8_rawoutput(&(w->b));
    printf("]");
}

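/* Inversion below uses the conjugate: 1/(a+ib) = (a-ib)/(a^2 - i^2.b^2).
   The FP8 norm a^2 - i^2.b^2 is inverted once, then multiplied into a and -b */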
/* Set w=1/x */
void YYY::FP16_inv(FP16 *w, FP16 *x)
{
    FP8 t1, t2;
    FP8_sqr(&t1, &(x->a));
    FP8_sqr(&t2, &(x->b));
    FP8_times_i(&t2);
    FP8_norm(&t2);

    FP8_sub(&t1, &t1, &t2);
    FP8_norm(&t1);

    FP8_inv(&t1, &t1, NULL);

    FP8_mul(&(w->a), &t1, &(x->a));
    FP8_neg(&t1, &t1);
    FP8_norm(&t1);
    FP8_mul(&(w->b), &t1, &(x->b));
}

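/* Since i^2 lies in FP8, (a+ib).i = i^2.b + i.a: multiplication by i swaps
   the halves and applies FP8_times_i to the new a-part */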
/* w*=i where i = sqrt(sqrt(sqrt(-1+sqrt(-1)))) */
void YYY::FP16_times_i(FP16 *w)
{
    FP8 s, t;
    FP8_copy(&s, &(w->b));
    FP8_copy(&t, &(w->a));
    FP8_times_i(&s);
    FP8_copy(&(w->a), &s);
    FP8_copy(&(w->b), &t);
    FP16_norm(w);

    //FP16_neg(w,w);  // ***
    //FP16_norm(w);
}

void YYY::FP16_times_i2(FP16 *w)
{
    FP8_times_i(&(w->a));
    FP8_times_i(&(w->b));
}

void YYY::FP16_times_i4(FP16 *w)
{
    FP8_times_i2(&(w->a));
    FP8_times_i2(&(w->b));
}

/* Set w=w^p using Frobenius */
void YYY::FP16_frob(FP16 *w, FP2 *f)
{   // f=(i+1)^(p-3)/8
    FP2 ff;
    FP2_sqr(&ff, f);    // (i+1)^(p-3)/4
    FP2_norm(&ff);

    FP8_frob(&(w->a), &ff);
    FP8_frob(&(w->b), &ff);

    FP8_qmul(&(w->b), &(w->b), f); // times (1+i)^(p-3)/8
    FP8_times_i(&(w->b));          // (i+1)^(p-1)/8
}

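/* Exponentiation below is plain right-to-left binary: the bits of b are scanned
   from the least significant end, multiplying r by the running square when a bit is set */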
/* Set r=a^b mod m */
void YYY::FP16_pow(FP16 *r, FP16 *a, BIG b)
{
    FP16 w;
    BIG z, zilch;
    int bt;

    BIG_zero(zilch);

    BIG_copy(z, b);
    FP16_copy(&w, a);
    FP16_one(r);
    BIG_norm(z);
    while (1)
    {
        bt = BIG_parity(z);
        BIG_shr(z, 1);
        if (bt) FP16_mul(r, r, &w);
        if (BIG_comp(z, zilch) == 0) break;
        FP16_sqr(&w, &w);
    }
    FP16_reduce(r);
}

/* Conditionally move g to f if d=1 */
void YYY::FP16_cmove(FP16 *f, FP16 *g, int d)
{
    FP8_cmove(&(f->a), &(g->a), d);
    FP8_cmove(&(f->b), &(g->b), d);
}

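/* A minimal usage sketch (illustrative only, not part of the library):

    FP8 u;                          // assume u is initialised elsewhere
    FP16 g, h;
    BIG e;
    char buf[16 * MODBYTES_XXX];

    FP16_from_FP8(&g, &u);          // embed u as the real part
    BIG_zero(e); BIG_inc(e, 7); BIG_norm(e);
    FP16_pow(&h, &g, e);            // h = g^7
    FP16_toBytes(buf, &h);          // 16*MODBYTES_XXX bytes, b part first
*/
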
//#if CURVE_SECURITY_ZZZ == 256

/* XTR xtr_a function */
/*
void YYY::FP16_xtr_A(FP16 *r, FP16 *w, FP16 *x, FP16 *y, FP16 *z)
{
    FP16 t1, t2;

    FP16_copy(r, x);
    FP16_sub(&t1, w, y);
    FP16_norm(&t1);
    FP16_pmul(&t1, &t1, &(r->a));
    FP16_add(&t2, w, y);
    FP16_norm(&t2);
    FP16_pmul(&t2, &t2, &(r->b));
    FP16_times_i(&t2);

    FP16_add(r, &t1, &t2);
    FP16_add(r, r, z);

    FP16_reduce(r);
}
*/
/* XTR xtr_d function */
/*
void YYY::FP16_xtr_D(FP16 *r, FP16 *x)
{
    FP16 w;
    FP16_copy(r, x);
    FP16_conj(&w, r);
    FP16_add(&w, &w, &w);
    FP16_sqr(r, r);
    FP16_norm(&w);
    FP16_sub(r, r, &w);
    FP16_reduce(r); // reduce here as multiple calls trigger automatic reductions
}
*/

/* r=x^n using XTR method on traces of FP48s */
/*
void YYY::FP16_xtr_pow(FP16 *r, FP16 *x, BIG n)
{
    int i, par, nb;
    BIG v;
    FP2 w2;
    FP4 w4;
    FP8 w8;
    FP16 t, a, b, c, sf;

    FP16_copy(&sf, x);
    FP16_norm(&sf);
    BIG_zero(v);
    BIG_inc(v, 3);
    BIG_norm(v);
    FP2_from_BIG(&w2, v);
    FP4_from_FP2(&w4, &w2);
    FP8_from_FP4(&w8, &w4);
    FP16_from_FP8(&a, &w8);

    FP16_copy(&b, &sf);
    FP16_xtr_D(&c, &sf);

    par = BIG_parity(n);
    BIG_copy(v, n);
    BIG_norm(v);
    BIG_shr(v, 1);
    if (par == 0)
    {
        BIG_dec(v, 1);
        BIG_norm(v);
    }

    nb = BIG_nbits(v);
    for (i = nb - 1; i >= 0; i--)
    {
        if (!BIG_bit(v, i))
        {
            FP16_copy(&t, &b);
            FP16_conj(&sf, &sf);
            FP16_conj(&c, &c);
            FP16_xtr_A(&b, &a, &b, &sf, &c);
            FP16_conj(&sf, &sf);
            FP16_xtr_D(&c, &t);
            FP16_xtr_D(&a, &a);
        }
        else
        {
            FP16_conj(&t, &a);
            FP16_xtr_D(&a, &b);
            FP16_xtr_A(&b, &c, &b, &sf, &t);
            FP16_xtr_D(&c, &c);
        }
    }

    if (par == 0) FP16_copy(r, &c);
    else FP16_copy(r, &b);
    FP16_reduce(r);
}
*/

/* r=ck^a.cl^n using XTR double exponentiation method on traces of FP48s. See Stam thesis. */
/*
void YYY::FP16_xtr_pow2(FP16 *r, FP16 *ck, FP16 *cl, FP16 *ckml, FP16 *ckm2l, BIG a, BIG b)
{
    int i, f2;
    BIG d, e, w;
    FP16 t, cu, cv, cumv, cum2v;

    BIG_copy(e, a);
    BIG_copy(d, b);
    BIG_norm(d);
    BIG_norm(e);
    FP16_copy(&cu, ck);
    FP16_copy(&cv, cl);
    FP16_copy(&cumv, ckml);
    FP16_copy(&cum2v, ckm2l);

    f2 = 0;
    while (BIG_parity(d) == 0 && BIG_parity(e) == 0)
    {
        BIG_shr(d, 1);
        BIG_shr(e, 1);
        f2++;
    }
    while (BIG_comp(d, e) != 0)
    {
        if (BIG_comp(d, e) > 0)
        {
            BIG_imul(w, e, 4);
            BIG_norm(w);
            if (BIG_comp(d, w) <= 0)
            {
                BIG_copy(w, d);
                BIG_copy(d, e);
                BIG_sub(e, w, e);
                BIG_norm(e);
                FP16_xtr_A(&t, &cu, &cv, &cumv, &cum2v);
                FP16_conj(&cum2v, &cumv);
                FP16_copy(&cumv, &cv);
                FP16_copy(&cv, &cu);
                FP16_copy(&cu, &t);
            }
            else if (BIG_parity(d) == 0)
            {
                BIG_shr(d, 1);
                FP16_conj(r, &cum2v);
                FP16_xtr_A(&t, &cu, &cumv, &cv, r);
                FP16_xtr_D(&cum2v, &cumv);
                FP16_copy(&cumv, &t);
                FP16_xtr_D(&cu, &cu);
            }
            else if (BIG_parity(e) == 1)
            {
                BIG_sub(d, d, e);
                BIG_norm(d);
                BIG_shr(d, 1);
                FP16_xtr_A(&t, &cu, &cv, &cumv, &cum2v);
                FP16_xtr_D(&cu, &cu);
                FP16_xtr_D(&cum2v, &cv);
                FP16_conj(&cum2v, &cum2v);
                FP16_copy(&cv, &t);
            }
            else
            {
                BIG_copy(w, d);
                BIG_copy(d, e);
                BIG_shr(d, 1);
                BIG_copy(e, w);
                FP16_xtr_D(&t, &cumv);
                FP16_conj(&cumv, &cum2v);
                FP16_conj(&cum2v, &t);
                FP16_xtr_D(&t, &cv);
                FP16_copy(&cv, &cu);
                FP16_copy(&cu, &t);
            }
        }
        if (BIG_comp(d, e) < 0)
        {
            BIG_imul(w, d, 4);
            BIG_norm(w);
            if (BIG_comp(e, w) <= 0)
            {
                BIG_sub(e, e, d);
                BIG_norm(e);
                FP16_xtr_A(&t, &cu, &cv, &cumv, &cum2v);
                FP16_copy(&cum2v, &cumv);
                FP16_copy(&cumv, &cu);
                FP16_copy(&cu, &t);
            }
            else if (BIG_parity(e) == 0)
            {
                BIG_copy(w, d);
                BIG_copy(d, e);
                BIG_shr(d, 1);
                BIG_copy(e, w);
                FP16_xtr_D(&t, &cumv);
                FP16_conj(&cumv, &cum2v);
                FP16_conj(&cum2v, &t);
                FP16_xtr_D(&t, &cv);
                FP16_copy(&cv, &cu);
                FP16_copy(&cu, &t);
            }
            else if (BIG_parity(d) == 1)
            {
                BIG_copy(w, e);
                BIG_copy(e, d);
                BIG_sub(w, w, d);
                BIG_norm(w);
                BIG_copy(d, w);
                BIG_shr(d, 1);
                FP16_xtr_A(&t, &cu, &cv, &cumv, &cum2v);
                FP16_conj(&cumv, &cumv);
                FP16_xtr_D(&cum2v, &cu);
                FP16_conj(&cum2v, &cum2v);
                FP16_xtr_D(&cu, &cv);
                FP16_copy(&cv, &t);
            }
            else
            {
                BIG_shr(d, 1);
                FP16_conj(r, &cum2v);
                FP16_xtr_A(&t, &cu, &cumv, &cv, r);
                FP16_xtr_D(&cum2v, &cumv);
                FP16_copy(&cumv, &t);
                FP16_xtr_D(&cu, &cu);
            }
        }
    }
    FP16_xtr_A(r, &cu, &cv, &cumv, &cum2v);
    for (i = 0; i < f2; i++) FP16_xtr_D(r, r);
    FP16_xtr_pow(r, r, d);
}

#endif
*/