| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708 | #ifndef MANDEL_FIXED128_H#define MANDEL_FIXED128_H#ifdef _MSC_VER#   include <intrin.h>#endif#include <cinttypes>#include <cmath>#include <utility>#include <array>#include <vector>#include <boost/serialization/nvp.hpp>#include <boost/multiprecision/cpp_int.hpp>#include <boost/multiprecision/cpp_bin_float.hpp>namespace mnd{#if defined(_MSC_VER) && defined(_WIN64)    static inline std::pair<int64_t, uint64_t> mul64(int64_t a, int64_t b) {        int64_t higher;        int64_t lower = _mul128(a, b, &higher);        return { higher, lower };    }    static inline std::pair<uint64_t, uint64_t> mulu64(uint64_t a, uint64_t b) {        uint64_t higher;        uint64_t lower = _umul128(a, b, &higher);        return { higher, lower };    }#elif defined(__SIZEOF_INT128__)    static inline std::pair<int64_t, uint64_t> mul64(int64_t a, int64_t b) {        __int128_t result = __int128_t(a) * __int128_t(b);        return { result >> 64, uint64_t(result & 0xFFFFFFFFFFFFFFFFULL) };    }    static inline std::pair<uint64_t, uint64_t> mulu64(uint64_t a, uint64_t b) {        __uint128_t result = __uint128_t(a) * __uint128_t(b);        return { result >> 64, uint64_t(result & 0xFFFFFFFFFFFFFFFFULL) };    }#else    static inline std::pair<int64_t, uint64_t> mul64(int64_t a, int64_t b) {        uint32_t aa[2] = { uint32_t(a >> 32), uint32_t(a & 0xFFFFFFFF) };        uint32_t bb[2] = { uint32_t(b >> 32), uint32_t(b & 0xFFFFFFFF) };        uint32_t res[4];        int64_t temp = uint64_t(aa[1]) * uint64_t(bb[1]);        res[3] = temp & 0xFFFFFFFF;        temp >>= 32;        temp += int64_t(int32_t(aa[0])) * int64_t(bb[1]) + int64_t(aa[1]) * int64_t(int32_t(bb[0]));        res[2] = temp & 0xFFFFFFFF;        temp >>= 32;        temp += int64_t(int32_t(aa[0])) * int64_t(int32_t(bb[0]));        res[1] = temp & 0xFFFFFFFF;        res[0] = temp >> 32;        return std::make_pair((int64_t(res[0]) << 32) | res[1], uint64_t((int64_t(res[2]) << 32) | res[3]));    }    static inline std::pair<uint64_t, uint64_t> mulu64(uint64_t a, uint64_t b) {        uint32_t aa[2] = { uint32_t(a >> 32), uint32_t(a & 0xFFFFFFFF) };        uint32_t bb[2] = { uint32_t(b >> 32), uint32_t(b & 0xFFFFFFFF) };        uint32_t res[4];        uint64_t temp = uint64_t(aa[1]) * bb[1];        res[3] = temp & 0xFFFFFFFF;        uint32_t carry = temp >> 32;        temp = uint64_t(aa[0]) * bb[1] + uint64_t(aa[1]) * bb[0] + carry;        res[2] = temp & 0xFFFFFFFF;        carry = temp >> 32;        temp = uint64_t(aa[0]) * bb[0] + carry;        res[1] = temp & 0xFFFFFFFF;        res[0] = temp >> 32;        return std::make_pair((uint64_t(res[0]) << 32) | res[1], (uint64_t(res[2]) << 32) | res[3] );    }#endif}struct Fixed512{    using Once = boost::multiprecision::int512_t;    using Twice = boost::multiprecision::int1024_t;    Once body;    inline explicit Fixed512(const Once& body) :        body{ body }    {}    using Float256 = boost::multiprecision::number<        boost::multiprecision::backends::cpp_bin_float<            240, boost::multiprecision::backends::digit_base_2, void, boost::int16_t, -16382, 16383>,            boost::multiprecision::et_off>;    using Float512 = boost::multiprecision::number<        boost::multiprecision::backends::cpp_bin_float<            496, boost::multiprecision::backends::digit_base_2, void, boost::int16_t, -16382, 16383>,            boost::multiprecision::et_off>;    inline Fixed512(const Float256& val)    {        body = Once{ val * boost::multiprecision::pow(Float256{ 2 }, 512 - 32) };    }    inline Fixed512(const Float512& val)    {        body = Once{ val * boost::multiprecision::pow(Float512{ 2 }, 512 - 32) };    }    inline Fixed512(double val)    {        body = Once{ boost::multiprecision::pow(Float512{ 2 }, 512 - 32) * val };    }    inline operator Float256(void) const {        return boost::multiprecision::pow(Float256{ 0.5 }, 512 - 32) * Float256{ body };    }    inline operator Float512(void) const {        return boost::multiprecision::pow(Float512{ 0.5 }, 512 - 32) * Float512{ body };    }    inline Fixed512& operator += (const Fixed512& other) {        body += other.body;        return *this;    }    inline Fixed512 operator + (const Fixed512& other) const {        return Fixed512{ body + other.body };    }    inline Fixed512& operator -= (const Fixed512& other) {        body -= other.body;        return *this;    }    inline Fixed512 operator - (const Fixed512& other) const {        return Fixed512{ body - other.body };    }    inline Fixed512 operator * (const Fixed512& other) const {        auto prod = Twice{ this->body } * other.body;        return Fixed512{ Once{ prod >> (512 - 32) } };    }    inline Fixed512& operator *= (const Fixed512& other) {        auto prod = Twice{ this->body } * other.body;        body = Once{ prod >> (512 - 64) };        return *this;    }    inline bool operator > (const Fixed512& other) {        return this->body > other.body;    }};struct Fixed128{    uint64_t upper;    uint64_t lower;    Fixed128(const Fixed128&) = default;    ~Fixed128() = default;    inline Fixed128(uint64_t upper, uint64_t lower) :        upper{ upper }, lower{ lower }    {    }    inline Fixed128(uint32_t a, uint32_t b, uint32_t c, uint32_t d) :        upper{ (uint64_t(a) << 32) | b }, lower{ (uint64_t(c) << 32) | d }    {    }    inline Fixed128(double x)    {        const double twoToThe32 = double(0x100000000ULL);        upper = uint64_t(int64_t(x * twoToThe32));        double remainder = x - double(upper) / twoToThe32;        lower = uint64_t(int64_t(remainder * twoToThe32 * twoToThe32 * twoToThe32));    }    inline Fixed128 operator + (const Fixed128& other) const {        uint64_t lowerAdded = lower + other.lower;        uint64_t upperAdded = upper + other.upper + (lowerAdded < lower);        return Fixed128{ upperAdded, lowerAdded };    }        inline Fixed128& operator +=(const Fixed128& other) {        uint64_t lowerAdded = lower + other.lower;        upper += other.upper + (lowerAdded < lower);        lower = lowerAdded;        return *this;    }    inline Fixed128 operator - (const Fixed128& other) const {        uint64_t lowerSubbed = lower - other.lower;        uint64_t upperSubbed = upper - other.upper - (lowerSubbed > lower);        return Fixed128{ upperSubbed, lowerSubbed };    }    inline Fixed128 operator - (void) const {        return this->operator~() + Fixed128{ 0, 0, 0, 1 };    }    /*//private:    static inline std::pair<uint64_t, uint64_t> mul64(int64_t a, int64_t b) {        int32_t aa[2] = { int32_t(a >> 32), int32_t(a & 0xFFFFFFFF) };        int32_t bb[2] = { int32_t(b >> 32), int32_t(b & 0xFFFFFFFF) };        int32_t res[4];        int64_t temp = int64_t(aa[1]) * bb[1];        res[3] = temp & 0xFFFFFFFF;        int32_t carry = temp >> 32;        temp = int64_t(aa[0]) * bb[1] + int64_t(aa[1]) * bb[0] + carry;        res[2] = temp & 0xFFFFFFFF;        carry = temp >> 32;        temp = int64_t(aa[0]) * bb[0] + carry;        res[1] = temp & 0xFFFFFFFF;        res[0] = temp >> 32;        return std::make_pair(uint64_t((int64_t(res[0]) << 32) | res[1]), uint64_t((int64_t(res[2]) << 32) | res[3]));    }    static inline std::pair<uint64_t, uint64_t> mulu64(uint64_t a, uint64_t b) {        uint32_t aa[2] = { uint32_t(a >> 32), uint32_t(a & 0xFFFFFFFF) };        uint32_t bb[2] = { uint32_t(b >> 32), uint32_t(b & 0xFFFFFFFF) };        uint32_t res[4];        uint64_t temp = uint64_t(aa[1]) * bb[1];        res[3] = temp & 0xFFFFFFFF;        uint32_t carry = temp >> 32;        temp = uint64_t(aa[0]) * bb[1] + uint64_t(aa[1]) * bb[0] + carry;        res[2] = temp & 0xFFFFFFFF;        carry = temp >> 32;        temp = uint64_t(aa[0]) * bb[0] + carry;        res[1] = temp & 0xFFFFFFFF;        res[0] = temp >> 32;        return std::make_pair((uint64_t(res[0]) << 32) | res[1], (uint64_t(res[2]) << 32) | res[3] );    }    */public:    inline Fixed128 operator * (const Fixed128& other) const {        if (this->operator!=(Fixed128{ 0xFFFFFFFFFFFFFFFF, 0xFFFFFFFFFFFFFFFF }) && isNegative()) {            return -(other * this->operator-());        }        if (other.isNegative()) {            return -((-other) * (*this));        }        auto [uuc, uu] = mnd::mulu64(upper, other.upper);        auto [ulc, ul] = mnd::mulu64(upper, other.lower);        auto [luc, lu] = mnd::mulu64(lower, other.upper);        auto [llc, ll] = mnd::mulu64(lower, other.lower);        uint64_t res[4] = { 0, 0, 0, 0 };        res[3] = ll;        res[2] += lu;        res[2] += ul;        if (res[2] < ul)            res[1]++;        res[2] += llc;        if (res[2] < llc)            res[1]++;        res[1] += uu;        if (res[1] < uu)            res[0]++;        res[1] += ulc;        if (res[1] < ulc)            res[0]++;        res[1] += luc;        if (res[1] < luc)            res[0]++;        res[0] += uuc;        return Fixed128{ uint32_t(res[0] & 0xFFFFFFFF), uint32_t(int64_t(res[1]) >> 32), uint32_t(res[1] & 0xFFFFFFFF), uint32_t(int64_t(res[2]) >> 32) };        /*if (isNegative()) {            return -(this->operator-() * other);        }        if (other.isNegative()) {            return -(*this * (-other));        }        bool otherNegative = other.isNegative();        uint32_t quarters[4] = {            (upper >> 32) & 0xFFFFFFFF,            upper & 0xFFFFFFFF,            (lower >> 32) & 0xFFFFFFFF,            lower & 0xFFFFFFFF        };        auto [a, ra] = other.mul(quarters[0]);        auto [b, rb] = other.mul(quarters[1]);        auto [c, rc] = other.mul(quarters[2]);        auto [d, rd] = other.mul(quarters[3]);        b.arshift(1);        c.arshift(2);        d.arshift(3);        Fixed128 carries = { uint32_t(rb), uint32_t(rc), uint32_t(rd), 0 };        Fixed128 result = a + b + c + d + carries;        return result;*/    }    inline std::pair<Fixed128, uint32_t> mul(uint32_t factor) const {        uint32_t quarters[4] = {            uint32_t(upper >> 32) & 0xFFFFFFFF,            uint32_t(upper) & 0xFFFFFFFF,            uint32_t(lower >> 32) & 0xFFFFFFFF,            uint32_t(lower) & 0xFFFFFFFF        };        uint32_t newQ[4];        uint32_t carry = 0;        for (int i = 3; i >= 0; i--) {            int64_t prod = int64_t(quarters[i]) * factor + carry;            newQ[i] = prod & 0xFFFFFFFF;            carry = prod >> 32;        }        /*    newQ[i] = quarters[i] * factor;        uint64_t tempLower = newQ[3];        uint64_t newLower = tempLower + (newQ[2] << 32);        uint64_t newUpper = (newQ[2] >> 32) + newQ[1] + (newQ[0] << 32) + (newLower < tempLower ? 1 : 0);*/        return std::make_pair(Fixed128{ newQ[0], newQ[1], newQ[2], newQ[3] }, carry);    }private:    inline void add(uint64_t val, int b32offset) {        switch (b32offset) {        case 0:            upper += val << 32;            return;        case 1:            upper += val;            return;        case 2:            upper += val >> 32;            lower += val << 32;            return;        case 3: {            uint64_t newLower = lower + val;            if (newLower < lower) upper++;            lower = newLower;            return;        }        case 4:            uint64_t newLower = lower + (val >> 32);            if (lower > newLower) upper++;            lower += newLower;            return;        }    }    inline void addSigned(int64_t val, int b32offset) {        switch (b32offset) {        case 0:            upper += val << 32;            return;        case 1:            upper += val;            return;        case 2:            upper += val >> 32;            lower += val << 32;            return;        case 3:            lower += val;            if (val < 0) upper--;            return;                case 4: {            uint64_t newLower = lower + (val >> 32);            if (lower > newLower) upper++;            lower = newLower;            return;        }        default:            if (val < 0) {                if (lower == 0) upper--;                lower--;            }            return;        }    }public:    inline Fixed128 operator / (const Fixed128& other) {        if (this->operator!=(Fixed128{ 0xFFFFFFFFFFFFFFFF, 0xFFFFFFFFFFFFFFFF }) && isNegative()) {            return -((-(*this)) / other);        }        if (other != Fixed128{ 0xFFFFFFFFFFFFFFFF, 0xFFFFFFFFFFFFFFFF } && other.isNegative()) {            return -((*this) / (-other));        }        using u256 = std::array<uint64_t, 4>;        u256 bigDividend = { upper, lower, 0, 0 };        u256 bigDivisor = { 0, 0, other.upper, other.lower };        auto twice = [] (u256& x) {            bool carry = false;            for (int i = 3; i >= 0; i--) {                bool oldCarry = carry;                carry = x[i] & 0x1000000000000000ULL;                x[i] <<= 1;                if (oldCarry) x[i] ++;            }        };                auto geq = [] (const u256& a, const u256& b) -> bool {            for (int i = 0; i < 4; i++) {                if (a[i] > b[i])                    return true;                if (a[i] < b[i])                    return false;            }            return true;        };        auto sub = [] (u256& a, const u256& b) -> bool {            bool carry = false;            for (int i = 3; i >= 0; i--) {                uint64_t oldA = a[i];                a[i] -= b[i];                carry = oldA < a[i];            }            return carry;        };                auto add = [] (u256& a, const u256& b) -> bool {            bool carry = false;            for (int i = 3; i >= 0; i--) {                uint64_t oldA = a[i];                a[i] += b[i];                carry = oldA > a[i];            }            return carry;        };        u256 growingCount = { 0, 0, 0, 1 };        u256 quotient = { 0, 0, 0, 0 };        std::vector<u256> growingStack = { bigDivisor };        while (true) {            u256 beforeSub = bigDividend;            const u256& gr = growingStack[growingStack.size() - 1];            if (!sub(bigDividend, gr)) {                add(quotient, growingCount);                u256 tw = gr; twice(tw);                growingStack.push_back(tw);            }            else if (geq(bigDivisor, bigDividend)) {                break;            }            else {                bigDividend = beforeSub;                growingStack.pop_back();            }        }        return Fixed128{ quotient[2], quotient[3] };    }    bool isNegative(void) const {        return upper >> 63;    }    operator double(void) const {        const int64_t twoToThe32 = 0x100000000ULL;        return double(int64_t(upper)) / twoToThe32 + int64_t(lower) / twoToThe32 / twoToThe32 / twoToThe32;    }    inline Fixed128 operator ~ (void) const {        return Fixed128{ ~upper, ~lower };    }    inline bool operator == (const Fixed128& other) const {        return upper == other.upper && lower == other.lower;    }    inline bool operator != (const Fixed128& other) const {        return !operator==(other);    }    inline bool operator < (const Fixed128& other) const {        return upper < other.upper || (upper == other.upper && lower < other.lower);    }    inline bool operator <= (const Fixed128& other) const {        return operator<(other) || operator==(other);    }    inline bool operator > (const Fixed128& other) const {        return upper > other.upper || (upper == other.upper && lower > other.lower);    }    inline bool operator >= (const Fixed128& other) const {        return operator>(other) || operator==(other);    }};struct Fixed64{    int64_t bits;    Fixed64(const Fixed64&) = default;    ~Fixed64() = default;    explicit inline Fixed64(int64_t bits, bool /* dummy */) :        bits{ bits }    {    }    inline Fixed64(double x)    {        bits = int64_t(x * (1LL << 48));    }    inline operator float(void) const {        return bits * (1.0f / (1ULL << 48));    }    inline operator double(void) const {        return bits * (1.0 / (1ULL << 48));    }    inline Fixed64 operator + (const Fixed64& other) const {        return Fixed64{ bits + other.bits, true };    }        inline Fixed64& operator +=(const Fixed64& other) {        bits += other.bits;        return *this;    }    inline Fixed64 operator - (const Fixed64& other) const {        return Fixed64{ bits - other.bits, true };    }    inline Fixed64& operator -= (const Fixed64& other) {        bits -= other.bits;        return *this;    }    inline Fixed64 operator * (const Fixed64& other) {        /*int32_t upper = bits >> 32;        uint32_t lower = uint32_t(bits & 0xFFFFFFFF);        int64_t upup = int64_t(upper) * int64_t(upper);        int64_t loup = int64_t(upper) * int64_t(lower);        int64_t lolo = int64_t(lower) * int64_t(lower);        int32_t newUp = upup & 0xFFFFFFFF + (loup >> 32);        int32_t newLo = loup & 0xFFFFFFFF + (lolo >> 32);*/        /*double d = int32_t(bits >> 32) + double(uint32_t(bits)) / (1ULL << 32);        double od = int32_t(other.bits >> 32) + double(uint32_t(other.bits)) / (1ULL << 32);        return d * od;*/#if defined(__SIZEOF_INT128__)        __int128_t m = __int128_t(bits) * __int128_t(other.bits);        return Fixed64{ int64_t(m >> 48), true };#else        auto[hi, lo] = mnd::mul64(bits, other.bits);        return Fixed64{ int64_t((hi << 16) | (lo >> 48)), true };#endif        /*uint32_t a[2] = { uint32_t(uint64_t(bits) >> 32), uint32_t(bits & 0xFFFFFFFF) };        uint32_t b[2] = { uint32_t(uint64_t(other.bits) >> 32), uint32_t(other.bits & 0xFFFFFFFF) };        uint64_t a1b1 = uint64_t(a[1]) * b[1];        int64_t a0b1 = int64_t(int32_t(a[0])) * uint64_t(b[1]);        int64_t a1b0 = uint64_t(a[1]) * int64_t(int32_t(b[1]));        int64_t a0b0 = int64_t(int32_t(a[1])) * int64_t(int32_t(b[1]));        int64_t res = a1b1 >> 32;        res += a0b1 + a1b0;        res += a0b0 << 32;        return Fixed64{ res, true };*/        /*        uint32_t aa[2] = { uint32_t(uint64_t(bits) >> 32), uint32_t(bits & 0xFFFFFFFF) };        uint32_t bb[2] = { uint32_t(uint64_t(other.bits) >> 32), uint32_t(other.bits & 0xFFFFFFFF) };        uint64_t ab0[2] = { 0, 0 };        ab[1] = int64_t(int32_t(aa[1]) * int32_t(ab[0]));        ab[0] = int64_t(int32_t(aa[0]) * int32_t(ab[0]));        uint64_t ab1[2] = { 0, 0 };        ab[1] = aa[1] * ab[1];        ab[0] = int64_t(int32_t(aa[1]) * int32_t(ab[0]));        */        /*        boost::multiprecision::int128_t a(this->bits);        boost::multiprecision::int128_t b(other.bits);        return Fixed64{ int64_t((a * b) >> 32), true };        */        //return Fixed64{ (uint64_t(newUp) << 32) | newLo, true };    }    inline bool operator == (const Fixed64& other) {        return bits == other.bits;    }    inline bool operator != (const Fixed64& other) {        return !operator==(other);    }    inline bool operator < (const Fixed64& other) {        return bits < other.bits;    }    inline bool operator <= (const Fixed64& other) {        return operator<(other) || operator==(other);    }    inline bool operator > (const Fixed64& other) {        return bits > other.bits;    }    inline bool operator >= (const Fixed64& other) {        return operator>(other) || operator==(other);    }};struct Fixed32{    int32_t bits;    Fixed32(const Fixed32&) = default;    ~Fixed32() = default;    inline Fixed32(int32_t bits, bool) :        bits{ bits }    {    }    inline Fixed32(double x)    {        int integerPart = int(::floor(x));        double fractionalPart = x - integerPart;        /*if (x < 0) {            integerPart--;            fractionalPart = 1.0 - fractionalPart;        }*/        bits = int32_t(integerPart) << 16;        bits |= uint32_t(fractionalPart * (1ULL << 16)) & 0xFFFF;    }    inline Fixed32 operator + (const Fixed32& other) {        return Fixed32{ bits + other.bits, true };    }        inline Fixed32& operator +=(const Fixed32& other) {        bits += other.bits;        return *this;    }    inline Fixed32 operator - (const Fixed32& other) {        return Fixed32{ bits - other.bits, true };    }    inline Fixed32 operator * (const Fixed32& other) {        int64_t prod = int64_t(bits) * int64_t(other.bits);        return Fixed32{ int32_t(prod >> 16), true };        //return Fixed32{ (uint64_t(newUp) << 32) | newLo, true };    }    inline bool operator == (const Fixed32& other) {        return bits == other.bits;    }    inline bool operator != (const Fixed32& other) {        return !operator==(other);    }    inline bool operator < (const Fixed32& other) {        return bits < other.bits;    }    inline bool operator <= (const Fixed32& other) {        return operator<(other) || operator==(other);    }    inline bool operator > (const Fixed32& other) {        return bits > other.bits;    }    inline bool operator >= (const Fixed32& other) {        return operator>(other) || operator==(other);    }};#endif // MANDEL_FIXED128_H
 |