// Copyright Ryan Scott White. 2020, 2021, 2022, 2023, 2024 // Released under the MIT License. Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sub-license, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: // The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. // This struct was written by human hand. This may change soon. using System; using System.Diagnostics; using System.Diagnostics.CodeAnalysis; using System.Globalization; using System.Numerics; using System.Text; using static System.Runtime.InteropServices.JavaScript.JSType; namespace BigFloatLibrary; // for notes on zero see "BigFloatZeroNotes.txt" // Considerations when naming this class // BigFloat : This would indicate a number with a floating decimal point. This describes this class. // BigRational: This indicates the faction part stored as an actual fraction (Numerator/Denominator). // BigDecimal: This indicates processing/storage is base-10. However, this class is base-2 based. ///

/// BigFloat stores a BigInteger with a floating decimal point. ///

[DebuggerDisplay("{DebuggerDisplay}")] public readonly partial struct BigFloat : IComparable, IComparable, IEquatable { ///

/// <summary>
/// ExtraHiddenBits helps with precision by keeping an extra 32 bits. ExtraHiddenBits are a fixed
/// number of least-significant, sub-precise bits.
/// These bits help guard against some nuisances such as "7" * "9" being 60.
/// </summary>
public const int ExtraHiddenBits = 32;  // 0-62, must be even (for sqrt)

/// <summary>
/// Gets the full integer with the hidden bits.
/// </summary>
public readonly BigInteger DataBits { get; }

/// <summary>
/// _size is the number of precision bits. It is equal to "ABS(_int).GetBitLength()". The ABS is for
///       power-of-two negative BigIntegers (-1,-2,-4,-8...) so it is the same whether positive or negative.
/// _size INCLUDES ExtraHiddenBits (the Property Size subtracts out ExtraHiddenBits)
/// _size does not include rounding from ExtraHiddenBits. (11[111...111] (where [111...111] is ExtraHiddenBits) is still 2 bits. So the user will see it as 0b100 with a size of 2.)
/// _size is 0 only when '_int==0'
/// When BigFloat is Zero, the size is zero.
/// </summary>
internal readonly int _size; // { get; init; }

//future: Possible future feature
///// <summary>
///// When positive, it's the number of least significant digits in DataBits that repeat.
/////    Example: DataBits:11.001(with _extraPrecOrRepeat = 3) would be 11.001001001001...
///// When negative, it is the number of extra virtual zeros tacked on the end of the internal _int for better precision and accuracy.
/////    Example: 11.001(with _extraPrecOrRepeat = -3) would be the same as 11.001000
/////    For the above example "000" would not take up any space and is also guaranteed to be all 0 bits.
///// When zero, this feature does not get used. (Default)
///// </summary>
// private readonly int _extraPrecOrRepeat;

/// <summary>
/// The Scale (or -Accuracy) is the amount to left shift (&lt;&lt;) the integer (or right shift the radix point) to get to the desired value.
/// When BigFloat is Zero, scale is the point of least accuracy.
/// note: _scale = Scale-ExtraHiddenBits (or Scale = _scale + ExtraHiddenBits)
/// </summary>
public readonly int Scale { get; init; }

/// <summary>
/// The precision of the value: the number of bits required to hold the number once the
/// <see cref="ExtraHiddenBits"/> have been subtracted out. Never reported as negative.
/// </summary>
public readonly int Size
{
    get
    {
        int visibleBits = _size - ExtraHiddenBits;
        return visibleBits > 0 ? visibleBits : 0;
    }
}

/// <summary>
/// The number of data bits, with the <see cref="ExtraHiddenBits"/> counted.
/// </summary>
public readonly int SizeWithHiddenBits
{
    get { return _size; }
}

/// <summary>
/// The resulting binary point position when counting from the most significant bit.
/// Or where the [.]dataBits x 2^exp. Example: 0.11010 x 2^3 = 110.10 [Scale + Size]
/// Examples: 0.11 -> 0; 1.11 -> 1; 10.1 -> 2; .001 = -2
/// </summary>
public int Exponent
{
    get { return Scale + _size - ExtraHiddenBits; }
}

//see BigFloatZeroNotes.txt for notes
//perf: should we keep the shortcut "...&& Scale < 0 &&..."?

/// <summary>
/// Returns true if the internal data bits round to zero.
/// </summary>
public bool IsZero
{
    get
    {
        // Too many data bits to be treated as zero.
        if (_size >= ExtraHiddenBits - 2)
        {
            return false;
        }

        // The value must also stay below the hidden-bit boundary after the scale is applied.
        return (_size + Scale) < ExtraHiddenBits; // && Scale < 0
    }
}

// What is considered Zero: any dataInt that is LESS then 0:100000000, and also the shift results in a 0:100000000.
//
//   IntData    Scale Size Sz+Sc Precision  Zero
// 1:111111111 << -2   33    31      1       N
// 1:000000000 << -2   33    31      1       N
// 1:000000000 << -1   33    32      1       N
// 1:000000000 <<  0   33    33      1       N
// 0:111111111 << -1   32    31      0       N
// 0:100000000 << -1   32    31      0       N
// 0:100000000 <<  0   32    32      0       N
// 0:011111111 << -1   31    30     -1       Y
// 0:011111111 <<  0   31    31     -1       Y (borderline)
// 0:011111111 <<  1   31    32     -1       N
// 0:001111111 <<  1   31    32     -2       Y (borderline)
// 0:001111111 <<  2   31    33     -2       N
//
// NOTE(review): with ExtraHiddenBits = 32 the expression above requires _size < 30, yet the table
// lists rows with Size 31 as zero - confirm which of the two reflects the intended rule.

/// <summary>
/// Returns true if there is less than 1 bit of precision. However, a false value does not
/// guarantee that the number is precise.
/// </summary>
public bool OutOfPrecision
{
    get { return _size < ExtraHiddenBits; }
}

/// <summary>
/// Returns the precision of the BigFloat. This is the same as the size of the data bits.
/// The precision can be zero or negative. A negative precision means the number is below the
/// number of bits (HiddenBits) that are deemed precise.
/// </summary>
public int GetPrecision
{
    get { return _size - ExtraHiddenBits; }
}

/// <summary>
/// Returns the accuracy of the BigFloat. The accuracy is equivalent to the opposite of the scale.
/// A negative accuracy means the least significant bit is above the one place. A value of zero is
/// equivalent to an integer. A positive value is the number of accurate decimal places (in binary)
/// the number has.
/// </summary>
public int GetAccuracy
{
    get { return -Scale; }
}

/// <summary>
/// Rounds and returns true if this value is positive. Zero is not considered positive or negative.
/// Only the top bit in ExtraHiddenBits is counted.
/// </summary>
public bool IsPositive
{
    get { return Sign > 0; }
}

/// <summary>
/// Rounds and returns true if this value is negative. Only the top bit in ExtraHiddenBits is counted.
/// </summary>
public bool IsNegative
{
    get { return Sign < 0; }
}

/// <summary>
/// Rounds and returns -1 if negative, 0 if zero, and +1 if positive. Only the top bit in
/// ExtraHiddenBits and top out-of-precision hidden bit are included.
/// </summary>
public int Sign
{
    get
    {
        // Fewer than (ExtraHiddenBits - 1) data bits is reported as zero.
        if (_size < ExtraHiddenBits - 1)
        {
            return 0;
        }

        return DataBits.Sign;
    }
}

/// <summary>
/// Gets the integer part of the BigFloat. No scaling is applied. ExtraHiddenBits are rounded and removed.
/// </summary>
public readonly BigInteger Int
{
    get { return DataIntValueWithRound(DataBits); }
}

/// <summary>
/// Text used by the <c>[DebuggerDisplay]</c> attribute: the decimal string (with out-of-precision
/// bits), the magnitude in hex split as "upper:hidden", the size breakdown, and the scale as a shift.
/// </summary>
public string DebuggerDisplay
{
    get
    {
        BigInteger magnitude = BigInteger.Abs(DataBits);
        BigInteger hiddenMask = (BigInteger.One << ExtraHiddenBits) - 1;

        // The hidden bits rendered as exactly eight hex characters.
        string bottom8HexChars = (magnitude & hiddenMask).ToString("X8").PadLeft(8)[^8..];

        string signText = DataBits.Sign >= 0 ? " " : "-";
        string shiftText = (Scale >= 0) ? "<<" : ">>";

        return $"{ToString(true)}, "                                                         // integer part using ToString()
             + $"{signText}0x{magnitude >> ExtraHiddenBits:X}:{bottom8HexChars}"             // hex part
             + $"[{Size}+{ExtraHiddenBits}={_size}], {shiftText} {Math.Abs(Scale)}";
    }
}

/// <summary>
/// Prints debug information for the BigFloat to the console.
/// </summary>
/// <param name="varName">Prints an optional name of the variable.</param>
public void DebugPrint(string varName = null)
{
    // One past the largest value the hidden bits can hold, and the mask that selects them.
    ulong hiddenRange = (ulong)1 << ExtraHiddenBits;
    ulong hiddenMask = hiddenRange - 1;

    string shiftOperator = (Scale >= 0) ? "<<" : ">>";
    string shift = $"{shiftOperator} {Math.Abs(Scale)}";

    if (!string.IsNullOrEmpty(varName))
    {
        Console.WriteLine(varName + ":");
    }

    Console.WriteLine($" Debug : {DebuggerDisplay}");
    Console.WriteLine($" String : {ToString()}");
    //Console.WriteLine($" Int|hex: {_int >> ExtraHiddenBits:X}:{(_int & (uint.MaxValue)).ToString("X")[^8..]}[{Size}] {shift} (Hidden-bits round {(WouldRound() ? "up" : "down")})");
    Console.WriteLine($" Int|Hex : {ToStringHexScientific(true, true, false)} (Hidden-bits round {(WouldRound() ? "up" : "down")})");
    Console.WriteLine($" |Hex : {ToStringHexScientific(true, true, true)} (two's comp)");

    // Hidden bits shown as a decimal fraction; the leading character of the formatted double is dropped.
    string hiddenAsFraction = ((double)(DataBits & hiddenMask) / hiddenRange).ToString()[1..];
    Console.WriteLine($" |Dec : {DataBits >> ExtraHiddenBits}{hiddenAsFraction} {shift}");
    Console.WriteLine($" |Dec : {DataBits >> ExtraHiddenBits}:{DataBits & hiddenMask} {shift}");  // decimal part (e.g. .75)

    if (DataBits < 0)
    {
        string hiddenHex = (-DataBits & hiddenMask).ToString("X8")[^8..];
        Console.WriteLine($" or -{-DataBits >> ExtraHiddenBits:X4}:{hiddenHex}");
    }

    Console.WriteLine($" |_int: {DataBits}");
    Console.WriteLine($" Scale : {Scale}");
    Console.WriteLine();
}

/// <summary>
/// Returns a Zero with no size/precision.
/// </summary>
public static BigFloat ZeroWithNoPrecision
{
    get { return new BigFloat(BigInteger.Zero, 0, 0); }
}

/// <summary>
/// Returns a Zero with a given lower bound of precision. Example: -4 would result of 0.0000(in binary).
/// ExtraHiddenBits will be added.
/// </summary>
/// <param name="pointOfLeastPrecision">The precision can be positive or negative.</param>
public static BigFloat ZeroWithSpecifiedLeastPrecision(int pointOfLeastPrecision)
    => new BigFloat(BigInteger.Zero, pointOfLeastPrecision, 0);

/// <summary>
/// Returns a '1' with only 1 bit of precision. (1 &lt;&lt; ExtraHiddenBits)
/// </summary>
public static BigFloat One
{
    get
    {
        BigInteger rawOne = BigInteger.One << ExtraHiddenBits;
        return new BigFloat(rawOne, 0, ExtraHiddenBits + 1);
    }
}

/// <summary>
/// Returns a "1" with additional Accuracy. This is beyond the ExtraHiddenBits.
/// </summary>
/// <param name="precisionInBits">The precision between -32(ExtraHiddenBits) to Int.MaxValue.</param>
public static BigFloat OneWithAccuracy(int precisionInBits)
{
    // if the precision is shrunk to a size of zero it cannot contain any data bits
    if (precisionInBits <= -ExtraHiddenBits)
    {
        return ZeroWithNoPrecision;
        // alternative: throw new ArgumentException("The requested precision would leave not leave any bits.");
    }

    int totalShift = ExtraHiddenBits + precisionInBits;
    return new BigFloat(BigInteger.One << totalShift, -precisionInBits, ExtraHiddenBits + 1 + precisionInBits);
}

/// <summary>
/// Returns an integer with additional accuracy. This is beyond the ExtraHiddenBits.
/// </summary>
/// <param name="intVal">The integer value to represent.</param>
/// <param name="precisionInBits">The precision between (-ExtraHiddenBits - intVal.BitSize) to Int.MaxValue.</param>
/// <returns>
/// The value with <paramref name="precisionInBits"/> extra bits of accuracy, or
/// <see cref="ZeroWithNoPrecision"/> when the requested precision leaves no data bits.
/// </returns>
public static BigFloat IntWithAccuracy(BigInteger intVal, int precisionInBits)
{
    int intSize = (int)BigInteger.Abs(intVal).GetBitLength();

    // if the precision is shrunk to a size of zero it cannot contain any data bits
    if (precisionInBits < -(ExtraHiddenBits + intSize))
    {
        return ZeroWithNoPrecision;
        // alternative: throw new ArgumentException("The requested precision would leave not leave any bits.");
    }

    // A negative shift count is a right shift for BigInteger.
    BigInteger rawValue = intVal << (ExtraHiddenBits + precisionInBits);

    // Measure the size on the value actually stored. The arithmetic shortcut
    // (ExtraHiddenBits + intSize + precisionInBits) is wrong when intVal is zero (size must be 0)
    // and when a negative value is right-shifted (the shift floors, which can keep an extra bit).
    int rawSize = (int)BigInteger.Abs(rawValue).GetBitLength();

    return new BigFloat(rawValue, -precisionInBits, rawSize);
}

/// <summary>
/// Returns an integer with additional accuracy. This is beyond the ExtraHiddenBits.
/// </summary>
/// <param name="intVal">The integer value to represent. <see cref="int.MinValue"/> is supported.</param>
/// <param name="precisionInBits">The precision between (-ExtraHiddenBits - intVal.BitSize) to Int.MaxValue.</param>
/// <returns>
/// The value with <paramref name="precisionInBits"/> extra bits of accuracy, or
/// <see cref="ZeroWithNoPrecision"/> when the requested precision leaves no data bits.
/// </returns>
public static BigFloat IntWithAccuracy(int intVal, int precisionInBits)
{
    // Work in BigInteger so that the magnitude of int.MinValue is representable
    // (int.Abs(int.MinValue) throws an OverflowException).
    BigInteger value = intVal;
    int size = (int)BigInteger.Abs(value).GetBitLength() + ExtraHiddenBits;

    // if the precision is shrunk to a size of zero it cannot contain any data bits
    if (precisionInBits < -size)
    {
        return ZeroWithNoPrecision;
    }

    // A negative shift count is a right shift for BigInteger.
    BigInteger rawValue = value << (ExtraHiddenBits + precisionInBits);

    // Measure the size on the stored value so it is 0 for zero and stays equal to the bit length
    // of the magnitude even when a negative value was right-shifted.
    int rawSize = (int)BigInteger.Abs(rawValue).GetBitLength();

    return new BigFloat(rawValue, -precisionInBits, rawSize);
}

/// <summary>
/// Returns a '-1' with only 1 bit of precision. (-1 &lt;&lt; ExtraHiddenBits)
/// </summary>
public static BigFloat NegativeOne => new(BigInteger.MinusOne << ExtraHiddenBits, 0, ExtraHiddenBits + 1);

/////////////////////////    INIT / CONVERSION  FUNCTIONS     /////////////////////////

/// <summary>
/// Constructs a BigFloat using the raw elemental parts. The caller is responsible for
/// pre-up-shifting <paramref name="rawValue"/> and for supplying a matching
/// <paramref name="scale"/> and <paramref name="rawValueSize"/>; nothing is derived here.
/// </summary>
/// <param name="rawValue">The raw integerPart. It should INCLUDE the ExtraHiddenBits.</param>
/// <param name="scale">The value stored as <see cref="Scale"/>.</param>
/// <param name="rawValueSize">The size of rawValue.</param>
private BigFloat(BigInteger rawValue, int scale, int rawValueSize)
{
    _size = rawValueSize;
    Scale = scale;
    DataBits = rawValue;

    AssertValid();
}

/// <summary>
/// Constructs a BigFloat using its elemental parts.
/// </summary>
/// <param name="integerPart">The integer part of the BigFloat that will have a <paramref name="scale"/> applied to it.</param>
/// <param name="scale">How much should the <paramref name="integerPart"/> be shifted or scaled? This shift (base-2 exponent) will be applied to the <paramref name="integerPart"/>.</param>
/// <param name="valueIncludesHiddenBits">if true, then the hidden bits should be included in the integer part.</param>
public BigFloat(BigInteger integerPart, int scale = 0, bool valueIncludesHiddenBits = false)
{
    int applyHiddenBits = valueIncludesHiddenBits ? 0 : ExtraHiddenBits;

    DataBits = integerPart << applyHiddenBits;
    // we need Abs() so items that are a negative power of 2 has the same size as the positive version.
    _size = (int)BigInteger.Abs(DataBits).GetBitLength();
    Scale = scale; // _int of zero can have scale
    AssertValid();
}

/// <summary>
/// Constructs a BigFloat from the numeric value of a <see cref="char"/>.
/// </summary>
/// <param name="integerPart">The value; it is up-shifted by ExtraHiddenBits.</param>
/// <param name="scale">The base-2 scale stored with the value.</param>
public BigFloat(char integerPart, int scale = 0)
{
    DataBits = (BigInteger)integerPart << ExtraHiddenBits;
    Scale = scale;

    // char is unsigned, so there is no negative / MinValue case to handle here.
    _size = integerPart == 0 ? 0 : BitOperations.Log2(integerPart) + 1 + ExtraHiddenBits;
    AssertValid();
}

/// <summary>
/// Constructs a BigFloat from a <see cref="byte"/>.
/// </summary>
/// <param name="integerPart">The value; it is up-shifted by ExtraHiddenBits.</param>
/// <param name="scale">The base-2 scale stored with the value.</param>
public BigFloat(byte integerPart, int scale = 0)
{
    DataBits = (BigInteger)integerPart << ExtraHiddenBits;
    Scale = scale;
    _size = integerPart == 0 ? 0 : BitOperations.Log2(integerPart) + 1 + ExtraHiddenBits;
    AssertValid();
}

/// <summary>
/// Constructs a BigFloat from an <see cref="int"/> by forwarding to the <see cref="long"/> constructor.
/// </summary>
public BigFloat(int integerPart, int scale = 0) : this((long)integerPart, scale) { }

/// <summary>
/// Constructs a BigFloat from a <see cref="uint"/>.
/// </summary>
/// <param name="value">The value; it is up-shifted by ExtraHiddenBits.</param>
/// <param name="scale">The base-2 scale stored with the value.</param>
public BigFloat(uint value, int scale = 0)
{
    DataBits = (BigInteger)value << ExtraHiddenBits;
    Scale = scale;
    _size = value == 0 ? 0 : BitOperations.Log2(value) + 1 + ExtraHiddenBits;
    AssertValid();
}

/// <summary>
/// Constructs a BigFloat from a <see cref="long"/>.
/// </summary>
/// <param name="value">The value; it is up-shifted by ExtraHiddenBits.</param>
/// <param name="scale">The base-2 scale stored with the value.</param>
public BigFloat(long value, int scale = 0)
{
    DataBits = (BigInteger)value << ExtraHiddenBits;
    Scale = scale;
    _size = value switch
    {
        > 0 => BitOperations.Log2((ulong)value) + 1 + ExtraHiddenBits,
        // ~(x - 1) on the unsigned bits is the magnitude, which also works for long.MinValue.
        < 0 => 64 - BitOperations.LeadingZeroCount(~((ulong)value - 1)) + ExtraHiddenBits,
        _ => 0,
    };
    AssertValid();
}

/// <summary>
/// Constructs a BigFloat from a <see cref="ulong"/>.
/// </summary>
/// <param name="value">The value; it is up-shifted by ExtraHiddenBits.</param>
/// <param name="scale">The base-2 scale stored with the value.</param>
public BigFloat(ulong value, int scale = 0)
{
    DataBits = (BigInteger)value << ExtraHiddenBits;
    Scale = scale;
    _size = value == 0 ? 0 : BitOperations.Log2(value) + 1 + ExtraHiddenBits;
    AssertValid();
}

/// <summary>
/// Constructs a BigFloat from an <see cref="Int128"/>.
/// </summary>
/// <param name="integerPart">The value; it is up-shifted by ExtraHiddenBits.</param>
/// <param name="scale">The base-2 scale stored with the value.</param>
public BigFloat(Int128 integerPart, int scale = 0)
{
    DataBits = (BigInteger)integerPart << ExtraHiddenBits;
    Scale = scale;

    _size = integerPart > Int128.Zero
        ? (int)Int128.Log2(integerPart) + 1 + ExtraHiddenBits
        : integerPart < Int128.Zero ? 128 - (int)Int128.LeadingZeroCount(~(integerPart - 1)) + ExtraHiddenBits
        : 0;

    AssertValid();
}

/// <summary>
/// Constructs a BigFloat from an <see cref="Int128"/> that may already contain the hidden bits.
/// </summary>
/// <param name="integerPart">The integer part of the BigFloat.</param>
/// <param name="scale">The base-2 scale stored with the value.</param>
/// <param name="valueIncludesHiddenBits">if true, then the hidden bits should be included in the integer part.</param>
public BigFloat(Int128 integerPart, int scale, bool valueIncludesHiddenBits)
{
    int applyHiddenBits = valueIncludesHiddenBits ? 0 : ExtraHiddenBits;

    // Widen to BigInteger BEFORE shifting; shifting the Int128 itself drops the upper bits of large values.
    DataBits = (BigInteger)integerPart << applyHiddenBits;

    // Measure the magnitude of what was stored: 0 for zero, and no negation of Int128.MinValue is needed.
    _size = (int)BigInteger.Abs(DataBits).GetBitLength();
    Scale = scale; // _int of zero can have scale
    AssertValid();
}

/// <summary>
/// Constructs a BigFloat from a <see cref="double"/> by decoding its IEEE-754 bit fields.
/// </summary>
/// <param name="value">The value to convert. NaN and infinities are rejected.</param>
/// <param name="additionalScale">Extra base-2 scale added on top of the value's own exponent.</param>
/// <exception cref="OverflowException">The value is NaN or an infinity.</exception>
public BigFloat(double value, int additionalScale = 0)
{
    long bits = BitConverter.DoubleToInt64Bits(value);
    long mantissa = bits & 0xfffffffffffffL;
    int exp = (int)((bits >> 52) & 0x7ffL);

    if (exp == 2047)  // 2047 represents inf or NAN
    {
        ThrowInitializeException(); // mantissa==0 is Inf else NAN
    }
    else if (exp != 0)
    {
        // Normal number: restore the implicit leading 1 bit (bit 52).
        mantissa |= 0x10000000000000L;
        if (value < 0)
        {
            mantissa = -mantissa;
        }
        DataBits = new BigInteger(mantissa) << ExtraHiddenBits;
        Scale = exp - 1023 - 52 + additionalScale;
        _size = 53 + ExtraHiddenBits;
    }
    else // exp is 0 so this is a denormalized float (leading "1" is "0" instead)
    {
        // 0:00000000000:00...0001 -> smallest value (Epsilon)
        if (mantissa == 0)
        {
            DataBits = 0;
            Scale = additionalScale;
            _size = 0;
        }
        else
        {
            // Take the size before the sign is applied so it reflects the magnitude.
            int size = 64 - BitOperations.LeadingZeroCount((ulong)mantissa);
            if (value < 0)
            {
                mantissa = -mantissa;
            }
            DataBits = (new BigInteger(mantissa)) << (ExtraHiddenBits);
            Scale = -1023 - 52 + 1 + additionalScale;
            _size = size + ExtraHiddenBits;
        }
    }

    AssertValid();
}

/// <summary>
/// Constructs a BigFloat from a <see cref="float"/> by decoding its IEEE-754 bit fields.
/// </summary>
/// <param name="value">The value to convert. NaN and infinities are rejected.</param>
/// <param name="additionalScale">Extra base-2 scale added on top of the value's own exponent.</param>
/// <exception cref="OverflowException">The value is NaN or an infinity.</exception>
public BigFloat(float value, int additionalScale = 0)
{
    int bits = BitConverter.SingleToInt32Bits(value);
    int mantissa = bits & 0x007fffff;
    int exp = (int)((bits >> 23) & 0xffL);

    if (exp != 0)
    {
        if (exp == 255)
        {
            ThrowInitializeException(); // mantissa==0 is Inf else NAN
        }

        // Add leading 1 bit
        mantissa |= 0x800000;
        if (value < 0)
        {
            mantissa = -mantissa;
        }
        DataBits = new BigInteger(mantissa) << ExtraHiddenBits;
        Scale = exp - 127 - 23 + additionalScale;
        _size = 24 + ExtraHiddenBits;
    }
    else // exp is 0 so this is a denormalized(Subnormal) float (leading "1" is "0" instead)
    {
        if (mantissa == 0)
        {
            DataBits = 0;
            Scale = additionalScale;
            _size = 0; //24 + ExtraHiddenBits;
        }
        else
        {
            BigInteger mant = new(value >= 0 ? mantissa : -mantissa);
            DataBits = mant << ExtraHiddenBits;
            Scale = -126 - 23 + additionalScale; //hack: 23 is a guess
            _size = 32 - BitOperations.LeadingZeroCount((uint)mantissa) + ExtraHiddenBits;
        }
    }

    AssertValid();
}

/// <summary>
/// Throws the exception used by the floating-point constructors for NaN and infinity inputs.
/// </summary>
/// <exception cref="OverflowException">Always thrown.</exception>
[DoesNotReturn]
private static void ThrowInitializeException()
{
    throw new OverflowException("Value was too large for a BigFloat.");
}

/// <summary>
/// Parses an input string and returns a BigFloat. If it fails, an exception is thrown.
/// This function supports:
///  - Positive or negative leading signs or no sign.
///  - Radix point (aka. decimal point for base 10)
///  - Hex strings starting with a [-,+,_]0x (radix point and sign supported)
///  - Binary strings starting with a [-,+,_]0b (radix point and sign supported)
/// </summary>
/// <param name="value">The input decimal/hex/binary number.</param>
/// <param name="additionalScale">Optional apply positive or negative base-2 scaling.(default is zero)</param>
public BigFloat(string value, int additionalScale = 0)
    => this = Parse(value, additionalScale);

///////////////////////// [END] INIT / CONVERSION FUNCTIONS [END] /////////////////////////

////////////////////////////////////////////////////////////////////////////////////////////
///////////////////////////////    TO_STRING  FUNCTIONS     ////////////////////////////////
////////////////////////////////////////////////////////////////////////////////////////////
// see "BigFloatToStringNotes.txt" and "BigFloatTryParseNotes.txt" for additional notes
//   string ToString() - calls ToStringDecimal()
//   string ToString(string format) - to Hex(e.g. A4B.F2) and Binary(e.g. 1010111.001)
//   string ToStringDecimal() - To Decimal, e.g. 9999.99
//   string ToStringHexScientific(bool showHiddenBits = false, bool showSize = false, bool showInTwosComplement = false) - e.g. "12AC<<22"

/// <summary>
/// Formats the value as a decimal string without the out-of-precision bits.
/// </summary>
[DebuggerHidden()]
public override string ToString() => ToStringDecimal(this, false);

/// <summary>
/// Formats the value as a decimal string.
/// </summary>
/// <param name="includeOutOfPrecisionBits">Passed through to <see cref="ToStringDecimal"/>.</param>
[DebuggerHidden()]
public string ToString(bool includeOutOfPrecisionBits = false) => ToStringDecimal(this, includeOutOfPrecisionBits);

/// <summary>
/// Format the value of the current instance to a decimal number.
/// Three output shapes are produced depending on the (possibly adjusted) scale:
/// a number with a decimal point (scale &lt; -1), a plain rounded integer (scale == 0), and
/// otherwise an integer whose unknown low digits are shown as 'X' or as an "e+N" suffix.
/// </summary>
/// <param name="val">The BigFloat that should be converted to a string.</param>
/// <param name="includeOutOfPrecisionBits">Include out-of-precision bits in result. This will include additional decimal places.</param>
/// <returns>The decimal text for <paramref name="val"/>.</returns>
//[DebuggerHidden()]
public static string ToStringDecimal(BigFloat val, bool includeOutOfPrecisionBits = false)
{
    BigInteger intVal = val.DataBits;
    int scale = val.Scale;
    int valSize = val._size;

    if (includeOutOfPrecisionBits)
    {
        // Treat the hidden bits as in-precision: up-shift the data and compensate in scale and size.
        intVal <<= ExtraHiddenBits;
        scale -= ExtraHiddenBits;
        valSize += ExtraHiddenBits;
    }

    if (scale < -1)
    {
        // Number will have a decimal point. (e.g. 222.22, 0.01, 3.1)
        // -1 is not enough to form a full decimal digit.

        // Get the number of places that should be returned after the decimal point.
        // (3.32192809488736235 is log2(10): binary digits per decimal digit.)
        int decimalDigits = -(int)((scale - 1.5) / 3.32192809488736235);

        // Multiplying by 5^n and later dropping n fewer bits is the same as multiplying by 10^n.
        BigInteger power5 = BigInteger.Abs(intVal) * BigInteger.Pow(5, decimalDigits);

        // Applies the scale to the number and rounds from bottom bit
        BigInteger power5Scaled = RightShiftWithRound(power5, -scale - decimalDigits + ExtraHiddenBits);

        // If zero, then special handling required. Add as many precision zeros based on scale.
        if (power5Scaled.IsZero)
        {
            if (RightShiftWithRound(intVal, ExtraHiddenBits).IsZero)
            {
                return $"0.{new string('0', decimalDigits)}";
            }

            // future: The below should not be needed.
            //// solves an issue when a "BigFloat(1, -8)" being 0.000
            decimalDigits++;
            power5 = BigInteger.Abs(intVal) * BigInteger.Pow(5, decimalDigits);
            power5Scaled = RightShiftWithRound(power5, -scale - decimalDigits + ExtraHiddenBits);
        }

        string numberText = power5Scaled.ToString();

        // Number of digits that fall left of the decimal point (negative: leading zeros are needed after "0.").
        int decimalOffset = numberText.Length - decimalDigits;
        //int decimalOffset2 = ((int)((_size - ExtraHiddenBits + scale2) / 3.32192809488736235)) - ((numberText[0] - '5') / 8.0);  //alternative

        if (decimalOffset < -10)  // 0.0000000000xxxxx
        {
            return $"{(intVal.Sign < 0 ? "-" : "")}{numberText}e-{decimalDigits}";
        }

        int exponent = scale + valSize - ExtraHiddenBits;

        // The length should have room for: [-][digits][.][digits]
        int length = (intVal < 0 ? 3 : 2) + numberText.Length - (exponent <= 0 ? decimalOffset : 1);
        char[] chars = new char[length];
        int position = 0;

        if (intVal < 0)
        {
            chars[position++] = '-';
        }

        // 0.#### or 0.000##### - lets check for these formats
        // We can round a 0.99 to a 1.00, hence the "(Exponent==0 && decimalOffset <= 0)"
        if (exponent < 0 || (exponent == 0 && decimalOffset <= 0))
        {
            chars[position++] = '0';
            chars[position++] = '.';

            // One '0' for every missing digit between the point and the first digit of numberText.
            for (int i = decimalOffset; i < 0; i++)
            {
                chars[position++] = '0';
            }

            numberText.CopyTo(0, chars, position, numberText.Length);
            return new string(chars);
        }

        // ####.##### - at this point it must be this format
        numberText.CopyTo(0, chars, position, decimalOffset);
        position += decimalOffset;
        chars[position++] = '.';
        numberText.CopyTo(decimalOffset, chars, position, decimalDigits);
        return new string(chars);
    }

    // Check to see if we have an integer, if so no Pow(5) scaling required
    if (scale == 0)
    {
        return DataIntValueWithRound(intVal).ToString();
    }

    // At this point we the number have a positive exponent. e.g 7XXXXX or 7e+10 (no decimal point)
    // (A scale of exactly -1 also reaches this point; maskSize is then 0 and the shift below is a right shift by one.)
    int maskSize = (int)((scale + 2.5) / 3.32192809488736235); // 2.5 is adjustable
    BigInteger resUnScaled = (intVal << (scale - maskSize)) / BigInteger.Pow(5, maskSize);

    // Applies the scale to the number and rounds from bottom bit
    BigInteger resScaled = RightShiftWithRound(resUnScaled, ExtraHiddenBits);

    // Let put together the string.
    StringBuilder result = new();
    result.Append(resScaled);
    if (maskSize > 10)
    {
        // Many unknown digits: use an exponent suffix in place of a long run of 'X'.
        result.Append("e+");
        result.Append(maskSize);
    }
    else
    {
        result.Append(new string('X', maskSize));
    }

    return result.ToString();
}

/// <summary>
/// Writes a BigFloat in Hex('X') or Binary('B'). A radix point is supported. Negative values must have a leading '-'.
/// </summary>
/// <param name="format">Format specifier: 'X' for hex, 'B' for binary, or empty for decimal.</param>
/// <returns>The value as a string.</returns>
/// <exception cref="FormatException">The first character of <paramref name="format"/> is neither 'X' nor 'B'.</exception>
public string ToString(string format)
{
    if (string.IsNullOrEmpty(format))
    {
        return ToString();
    }

    //// Lets round and remove the ExtraHiddenBits now.
    //BigInteger newInt = DataIntValueWithRound(BigInteger.Abs(_int), out bool needToRound);
    //int size = (int)newInt.GetBitLength();
    //int newScale = Scale;

    if (format[0] == 'X') //hex with radix point
    {
        if (Scale >= 0)
        {
            //return (newInt >> Scale).ToString("X");
            return (DataBits >> (ExtraHiddenBits - Scale)).ToString("X"); // This version includes hidden bits in result
        }

        // We have to align the INT to the nearest 4 bits for hex. We also want to remove the ExtraHiddenBits.
        // The number of bits between the radix point and the end should be divisible by 4. We will dig into the ExtraHiddenBits for this.
        int rightShift = (ExtraHiddenBits - Scale) & 0x03;

        BigInteger shiftedBigIntForDisplay = RightShiftWithRound(DataBits, rightShift);

        // NOTE(review): the insert position is counted from the START of the text and evaluates to -1
        // for Scale in -1..-3, which string.Insert rejects with ArgumentOutOfRangeException. The
        // intended radix position needs confirming before this is changed.
        return shiftedBigIntForDisplay.ToString("X").Insert((-Scale / 4) - 1, ".");
    }

    if (format[0] == 'B') // Signals a binary (with radix point)
    {
        // Setup destination and allocate memory
        Span<char> dstBytes = stackalloc char[_size - ExtraHiddenBits
            + Math.Max(Math.Max(Scale, -(_size - ExtraHiddenBits) - Scale), 0) // total number of out-of-precision zeros in the output.
            + (DataBits.Sign < 0 ? 1 : 0)   // add one if a leading '-' sign (-0.1)
            + (Scale < 0 ? 1 : 0)           // add one if it has a point like (1.1)
            + (Exponent <= 0 ? 1 : 0)];     // add one if <1 for leading Zero (0.1)
        int dstIndex = 0;

        // Three types
        //   Type '12300' - if all bits are to the left of the radix point(no radix point required)
        //   Type '12.30' - has numbers below AND above the point. (e.g. 11.01)
        //   Type '0.123' - all numbers are to the right of the radix point. (has leading 0.or - 0.)

        // Pre-append the leading sign.
        if (DataBits.Sign < 0)
        {
            dstBytes[dstIndex] = '-';
            dstIndex++;
        }

        // Setup source bits to read.
        ReadOnlySpan<byte> srcBytes = DataIntValueWithRound(BigInteger.Abs(DataBits)).ToByteArray();

        // LeadingZeroCount works on 32 bits here; subtracting 24 leaves the leading zeros of the top byte.
        int leadingZeroCount = BitOperations.LeadingZeroCount(srcBytes[^1]) - 24;

        if (Exponent <= 0)     // For binary numbers less then one. (e.g. 0.001101)
        {
            int outputZerosBetweenPointAndNumber = Math.Max(0, -(_size - ExtraHiddenBits) - Scale);
            dstBytes[dstIndex++] = '0';
            dstBytes[dstIndex++] = '.';

            // Add the leading zeros
            for (int i = 0; i < outputZerosBetweenPointAndNumber; i++)
            {
                dstBytes[dstIndex++] = '0';
            }

            WriteValueBits(srcBytes, leadingZeroCount, Size, dstBytes[dstIndex..]);
        }
        else if (Scale >= 0)   // For binary numbers with no radix point. (e.g. 1101)
        {
            int outputZerosBetweenNumberAndPoint = Math.Max(0, Scale);
            // Pre-fill the tail with the zeros that stand in for the scaled-out positions.
            dstBytes[^outputZerosBetweenNumberAndPoint..].Fill('0');
            WriteValueBits(srcBytes, leadingZeroCount, Size, dstBytes[dstIndex..]);
        }
        else                   // For numbers with a radix point in the middle (e.g. 101.1 or 10.01, or 1.00)
        {
            int outputBitsBeforePoint = _size - ExtraHiddenBits + Scale;
            int outputBitsAfterPoint = Math.Max(0, -Scale);

            WriteValueBits(srcBytes, leadingZeroCount, outputBitsBeforePoint, dstBytes[dstIndex..]);

            dstIndex += outputBitsBeforePoint;

            //Write Decimal point
            dstBytes[dstIndex++] = '.';
            WriteValueBits(srcBytes, leadingZeroCount + outputBitsBeforePoint, outputBitsAfterPoint, dstBytes[dstIndex..]);
        }

        return new string(dstBytes);
    }

    // If none of the above formats ('X' or 'B') matched, then fail.
    throw new FormatException($"The {format} format string is not supported.");

    // Copies bitCount bits of srcBytes (little-endian bytes, read from the most significant end,
    // starting bitStart bits in) into dstBytes as '0'/'1' characters.
    static void WriteValueBits(ReadOnlySpan<byte> srcBytes, int bitStart, int bitCount, Span<char> dstBytes)
    {
        int srcLoc = srcBytes.Length - 1;
        int dstByte = 0;
        int cur = bitStart;

        while (cur < bitStart + bitCount)
        {
            int curSrcByte = srcLoc - (cur >> 3);
            int curSrcBit = 7 - (cur & 0x7);

            byte b2 = srcBytes[curSrcByte];

            dstBytes[dstByte++] = (char)('0' + ((b2 >> curSrcBit) & 1));
            cur++;
        }
    }
}

/// <summary>
/// Generates the data-bits in hex followed by the amount to shift(in decimal). Example: 12AC&lt;&lt;22 or B1&gt;&gt;3
/// </summary>
/// <param name="showHiddenBits">Includes the extra 32 hidden bits. Example: 12AC:F0F00000&lt;&lt;22</param>
/// <param name="showSize">Appends a [##] to the number with it's size in bits. Example: 22AC[14]&lt;&lt;22</param>
/// <param name="showInTwosComplement">When enabled, shows the show result in two's complement form with no leading sign. Example: -5 --> B[3]&lt;&lt;0</param>
/// <returns>The formatted text.</returns>
public string ToStringHexScientific(bool showHiddenBits = false, bool showSize = false, bool showInTwosComplement = false)
{
    // Negative values are printed as "-" + magnitude unless two's complement output was requested.
    bool printAsMagnitude = !showInTwosComplement && DataBits.Sign < 0;
    BigInteger shown = printAsMagnitude ? -DataBits : DataBits;

    StringBuilder text = new();

    if (printAsMagnitude)
    {
        text.Append('-');
    }

    text.Append($"{shown >> ExtraHiddenBits:X}");

    if (showHiddenBits)
    {
        // Low 32 bits rendered as exactly eight hex characters.
        string hiddenHex = (shown & (uint.MaxValue)).ToString("X8")[^8..];
        text.Append(':').Append(hiddenHex);
    }

    if (showSize)
    {
        text.Append($"[{Size}]");
    }

    string shiftOperator = (Scale >= 0) ? "<<" : ">>";
    text.Append($" {shiftOperator} {Math.Abs(Scale)}");

    return text.ToString();
}

/// <summary>
/// A high performance BigInteger to binary string converter that supports 0 and negative numbers.
/// Negative numbers are returned with a leading '-' sign.
/// </summary>
/// <param name="x">The value to convert.</param>
/// <param name="dstBytes">
/// Destination buffer. It must be large enough for the optional sign plus one character per bit
/// of the magnitude (one character for zero). On return it is trimmed to the characters written.
/// </param>
private static void BigIntegerToBinarySpan(BigInteger x, ref Span<char> dstBytes)
{
    bool isNegative = x.Sign < 0;
    if (isNegative)
    {
        x = -x;
    }

    // Setup source
    // x is non-negative here, so export it unsigned. The signed form appends a 0x00 byte whenever
    // the top bit of the magnitude is set, which would be printed as a spurious leading '0'.
    ReadOnlySpan<byte> srcBytes = x.ToByteArray(isUnsigned: true);
    int srcLoc = srcBytes.Length - 1;

    // Find the first bit set in the first byte so we don't print extra zeros.
    int msb = BitOperations.Log2(srcBytes[srcLoc]);

    // Setup Target
    int dstLoc = 0;

    // Add leading '-' sign if negative.
    if (isNegative)
    {
        dstBytes[dstLoc++] = '-';
    }

    // The first byte is special because we don't want to print leading zeros.
    byte b = srcBytes[srcLoc--];
    for (int j = msb; j >= 0; j--)
    {
        dstBytes[dstLoc++] = (char)('0' + ((b >> j) & 1));
    }

    // Add the remaining bits.
    for (; srcLoc >= 0; srcLoc--)
    {
        byte b2 = srcBytes[srcLoc];
        for (int j = 7; j >= 0; j--)
        {
            dstBytes[dstLoc++] = (char)('0' + ((b2 >> j) & 1));
        }
    }

    // Report the written length through the ref parameter so an over-sized buffer does not
    // leak unused '\0' characters into the caller's string.
    dstBytes = dstBytes[..dstLoc];
}

/// <summary>
/// A high performance BigInteger to binary string converter that supports 0 and negative numbers.
/// Negative numbers will be returned as two's complement with no sign.
/// The output char[] size will be a multiple of 8.
/// </summary>
/// <param name="x">The value to convert.</param>
/// <param name="dstBytes">Destination buffer; it must hold eight characters per byte of <c>x.ToByteArray()</c>.</param>
private static void BigIntegerToBinarySpanTwosComplement(BigInteger x, ref Span<char> dstBytes)
{
    // Setup source
    ReadOnlySpan<byte> srcBytes = x.ToByteArray();

    // Setup Target
    int dstLoc = 0;

    // Emit every byte, most significant first, as eight '0'/'1' characters.
    for (int srcLoc = srcBytes.Length - 1; srcLoc >= 0; srcLoc--)
    {
        byte b2 = srcBytes[srcLoc];
        for (int j = 7; j >= 0; j--)
        {
            dstBytes[dstLoc++] = (char)('0' + ((b2 >> j) & 1));
        }
    }
}

/// <summary>
/// Converts a BigInteger to its binary text form.
/// </summary>
/// <param name="x">The value to convert.</param>
/// <param name="twosComplement">
/// When true, the two's complement bytes are written with no sign; otherwise the magnitude is
/// written with a leading '-' for negative values.
/// </param>
/// <returns>The binary text.</returns>
private static string BigIntegerToBinaryString(BigInteger x, bool twosComplement = false)
{
    if (twosComplement)
    {
        // Exactly eight characters per two's complement byte. (GetBitLength() + 7 can be smaller
        // than that, e.g. for 0 or 128, which overran the buffer.)
        Span<char> charsSpan = stackalloc char[x.GetByteCount() * 8];
        BigIntegerToBinarySpanTwosComplement(x, ref charsSpan);
        return new string(charsSpan);
    }
    else
    {
        // Size from the magnitude: a negative power of two has a shorter two's complement bit
        // length than its absolute value, which made the buffer too small (e.g. -128).
        // The extra slot(s) cover the '-' sign and a possible leading zero written by the helper.
        Span<char> charsSpan = stackalloc char[(int)BigInteger.Abs(x).GetBitLength() + ((x < 0) ? 2 : 1)];
        BigIntegerToBinarySpan(x, ref charsSpan);
        return new string(charsSpan);
    }
}

/// <summary>
/// Returns the requested number of most-significant bits of the magnitude as a binary string.
/// If more bits are requested than the data holds, all data bits are returned and the remainder
/// is padded on the right with underscores.
/// </summary>
/// <param name="numberOfBits">How many leading bits to return.</param>
public string GetMostSignificantBits(int numberOfBits)
{
    BigInteger abs = BigInteger.Abs(DataBits);
    int shiftAmount = _size - numberOfBits;

    if (shiftAmount >= 0)
    {
        // Enough data: drop the low bits that were not asked for.
        return BigIntegerToBinaryString(abs >> shiftAmount);
    }

    // Not enough data: show what exists and mark the missing positions.
    return BigIntegerToBinaryString(abs) + new string('_', -shiftAmount);
}

/// <summary>
/// Returns the value's bits, including hidden bits, as a string.
/// Negative values will have a leading '-' sign.
/// </summary>
/// <param name="twosComplement">Passed through to the binary string converter.</param>
public string GetAllBitsAsString(bool twosComplement = false)
    => BigIntegerToBinaryString(DataBits, twosComplement);

/// <summary>
/// Returns the value's bits as a string.
/// Negative values will have a leading '-' sign.
/// </summary>
public string GetBitsAsString()
    => BigIntegerToBinaryString(Int);

/////////////////////////// [END] TO_STRING FUNCTIONS [END] ////////////////////////////////

////////////////////////////////////////////////////////////////////////////////////////////
///////////////////////////////    PARSE  FUNCTIONS  FUNCTIONS     ////////////////////////////////
////////////////////////////////////////////////////////////////////////////////////////////
// see "BigFloatTryParseNotes.txt" for additional notes

/// <summary>
/// Parses a string to a BigFloat and throws when the text cannot be converted.
/// </summary>
/// <param name="numericString">The input decimal/hex/binary number.</param>
/// <param name="scale">Optional apply positive or negative base-2 scaling.(default is zero)</param>
/// <returns>The parsed value.</returns>
/// <exception cref="ArgumentException">The string could not be converted.</exception>
public static BigFloat Parse(string numericString, int scale = 0)
{
    if (!TryParse(numericString, out BigFloat biRes, scale))
    {
        throw new ArgumentException("Unable to convert string to BigFloat.");
    }

    biRes.AssertValid();
    return biRes;
}

/// <summary>
/// Parses a <paramref name="numericString"/> to a BigFloat.
/// This function supports:
///  - Positive or negative leading signs or no sign.
///  - Radix point (aka. decimal point for base 10)
///  - A lowercase 'e' exponent on decimal input (e.g. 123e10 or 123.123e+100)
///  - Hex strings starting with a [-,+,_]0x (radix point and sign supported)
///  - Binary strings starting with a [-,+,_]0b (radix point and sign supported)
/// This method does not throw on malformed text; it returns false instead.
/// </summary>
/// <param name="numericString">The input decimal/hex/binary number.</param>
/// <param name="result">The resulting BigFloat. Zero is returned if conversion failed.</param>
/// <param name="scale">Optional apply positive or negative base-2 scaling.(default is zero)</param>
/// <returns>Returns true if successful.</returns>
public static bool TryParse(string numericString, out BigFloat result, int scale = 0)
{
    if (string.IsNullOrEmpty(numericString))
    {
        result = new BigFloat(0);
        return false;
    }

    // Let us check for invalid short strings, 0x___ , or 0b___
    {
        int locAfterSign = (numericString[0] is '-' or '+') ? 1 : 0;
        if (numericString.Length == locAfterSign)    //[-,+][END] - fail
        {
            result = new BigFloat(0);
            return false;
        }
        else if (numericString[locAfterSign] == '0' && numericString.Length > locAfterSign + 1)  //[-,+]0___
        {
            bool isNeg = numericString[0] == '-';
            char prefixChar = numericString[locAfterSign + 1];
            if (prefixChar is 'b' or 'B')  //[-,+]0b___
            {
                // Skip the optional sign and the "0b" prefix. Slicing from locAfterSign (rather than
                // only checking for '-') makes a leading '+' work as well.
                return TryParseBinary(numericString.AsSpan(locAfterSign + 2), out result, scale, isNeg ? -1 : 0);
            }
            else if (prefixChar is 'x' or 'X')  //[-,+]0x___
            {
                // TryParseHex does not accept the "0x" prefix, so hand it the sign (if any) followed
                // by the digits only.
                ReadOnlySpan<char> hexText = locAfterSign == 0
                    ? numericString.AsSpan(2)
                    : string.Concat(numericString.AsSpan(0, 1), numericString.AsSpan(3)).AsSpan();
                return TryParseHex(hexText, out result, scale);
            }
            //else { } // [-,+]0[END] OR [-,+]0___  - continue(exceptions handled by BigInteger.Parse)
        }
    }

    int radixLoc = numericString.IndexOf('.');

    // There is a decimal point, so let's remove it to convert it to a BigInteger.
    if (radixLoc >= 0)
    {
        numericString = numericString.Remove(radixLoc, 1);
    }

    // Check for 'e'  like 123e10 or 123.123e+100
    int eLoc = numericString.IndexOf('e');
    int exp = 0;
    if (eLoc > 0)
    {
        // The radix point was removed above, so radixLoc > eLoc means it sat inside the exponent
        // (e.g. "1e1.5"), which is not a valid number.
        if (radixLoc > eLoc)
        {
            result = new BigFloat(0);
            return false;
        }

        int begOfExp = eLoc + 1;
        int expSign = 1;
        if (begOfExp < numericString.Length)
        {
            char sign = numericString[begOfExp];
            if (sign == '+')
            {
                begOfExp++;
            }
            else if (sign == '-')
            {
                begOfExp++;
                expSign = -1;
            }
        }

        // A missing, malformed or overflowing exponent is a parse failure, not an exception.
        if (!int.TryParse(numericString.AsSpan(begOfExp), out int expMagnitude))
        {
            result = new BigFloat(0);
            return false;
        }

        exp = expMagnitude * expSign;
        numericString = numericString[..eLoc];
    }

    // now that we removed the "." and/or "e", let us make sure the length is not zero
    if (numericString.Length == 0)
    {
        result = new BigFloat(0);
        return false;
    }

    if (!BigInteger.TryParse(numericString.AsSpan(), out BigInteger asInt))
    {
        result = new BigFloat(0);
        return false;
    }

    // There is no decimal point, so treat it as sitting after the last digit.
    if (radixLoc < 0)
    {
        radixLoc = numericString.Length;
    }

    if (asInt.IsZero)
    {
        // 3.3219... is log2(10): converts the count of decimal places into a base-2 scale.
        int scaleAmt = (int)((radixLoc - numericString.Length + exp) * 3.32192809488736235);
        result = new BigFloat(BigInteger.Zero, scaleAmt, 0);
        return true;
    }

    // If the user specifies a one (e.g., 1XXX OR 1 OR 0.01), the intended precision is closer to 2 bits.
    if (BigInteger.Abs(asInt).IsOne)
    {
        asInt <<= 1;
        scale -= 1;
    }

    // Set ROUND to 1 to enable round to nearest.
    // When 1, an extra LSBit is kept and if it's set it will round up. (e.g. 0.1011 => 0.110)
    const int ROUND = 1;
    BigInteger intPart;

    // Number of decimal digits to the right of the radix point after applying the exponent.
    int radixDepth = numericString.Length - radixLoc - exp;

    if (radixDepth == 0)
    {
        result = new BigFloat(asInt, scale);
    }
    else if (radixDepth >= 0) //111.111 OR 0.000111
    {
        BigInteger a = BigInteger.Pow(5, radixDepth);
        int multBitLength = (int)a.GetBitLength();
        multBitLength += (int)(a >> (multBitLength - 2)) & 0x1;      // Round up if closer to larger size
        int shiftAmt = multBitLength + ExtraHiddenBits - 1 + ROUND;  // added "-1" because it was adding one too many digits
        // make asInt larger by the size of "a" before dividing by "a"
        intPart = (((asInt << shiftAmt) / a) + ROUND) >> ROUND;
        scale += -multBitLength + 1 - radixDepth;
        result = new BigFloat(intPart, scale, true);
    }
    else // 100010XX
    {
        BigInteger a = BigInteger.Pow(5, -radixDepth);
        int multBitLength = (int)a.GetBitLength();
        int shiftAmt = multBitLength - ExtraHiddenBits - ROUND;
        // Since we are making asInt larger by multiplying it by "a", we now need to shrink it by size "a".
        intPart = (((asInt * a) >> shiftAmt) + ROUND) >> ROUND;
        scale += multBitLength - radixDepth;
        result = new BigFloat(intPart, scale, true);
    }

    result.AssertValid();
    return true;
}

// Allowed:
//  * ABC.DEF
//  * abc.abc      both uppercase/lowercases okay
//  * -ABC.DEF     leading minus okay
//  * 123 456 789  spaces or commas okay
//  * {ABC.DEF}    wrapped in {..} or (..) or ".."
//  * ABC_____     trailing spaces okay
// Not Allowed:
//  * 0xABC.DEF    leading 0x - use Parse for this)
//  * {ABC.DEF     must have leading and closing bracket
//  * {ABC.DEF)    brackets types must match
//  * {{ABC.DEF}}  limit of one bracket only
//  * 123,456 789  mixing different kinds of separators)

/// <summary>
/// Parses a hex string to a BigFloat. It supports a radix point(like a decimal point in base 10) and
/// negative numbers. It will also ignore spaces and tolerate values wrapped with double quotes and brackets.
/// </summary>
/// <param name="input">The value to parse.</param>
/// <param name="result">(out) The returned result.</param>
/// <param name="additionalScale">(optional) Any additional power-of-two scale amount to include. Negative values are okay.</param>
/// <returns>Returns true if successful.</returns>
public static bool TryParseHex(ReadOnlySpan<char> input, out BigFloat result, int additionalScale = 0)
{
    if (input.IsEmpty)
    {
        result = 0;
        return false;
    }

    // Buffers larger than this are taken from the heap so that very long inputs cannot overflow the stack.
    const int MaxStackChars = 512;

    bool usingComma = false;
    bool usingSpace = false;
    int radixLocation = 0;       // position in 'cleaned' where the radix point was seen (0 = none seen)
    int BraceTypeAndStatus = 0;  // 0=not used, 1=curly braces, 3=parentheses, 4=double quotes [negative means it has been closed]

    // Index 0 of 'cleaned' is reserved for a leading '0' (see below), so digits start at index 1.
    int destLoc = 1;

    // skip negative or positive sign
    bool isNeg = input[0] == '-';
    int inputCurser = (isNeg || input[0] == '+') ? 1 : 0;

    int cleanedLength = input.Length - inputCurser + 1;
    Span<char> cleaned = cleanedLength <= MaxStackChars ? stackalloc char[cleanedLength] : new char[cleanedLength];
    cleaned[0] = '0'; // Ensure we have a positive number

    for (; inputCurser < input.Length; inputCurser++)
    {
        char c = input[inputCurser];
        switch (c)
        {
            case (>= '0' and <= '9') or (>= 'a' and <= 'f') or (>= 'A' and <= 'F'):
                cleaned[destLoc++] = c;
                break;
            case '.':
                if (radixLocation != 0)
                {
                    // radix point already found earlier
                    result = 0;
                    return false;
                }
                radixLocation = destLoc;
                break;
            case ' ':
                if (usingComma)
                {
                    // already using commas as the separator
                    result = 0;
                    return false;
                }
                usingSpace = true;
                break;
            case ',':
                if (usingSpace)
                {
                    // already using spaces as the separator
                    result = 0;
                    return false;
                }
                usingComma = true;
                break;
            case '{':
                if (BraceTypeAndStatus != 0)
                {
                    // a wrapper has already been opened
                    result = 0;
                    return false;
                }
                BraceTypeAndStatus = 1;
                break;
            case '}':
                if (BraceTypeAndStatus != 1)
                {
                    // fail: no leading '{' or another wrapper type was used
                    result = 0;
                    return false;
                }
                BraceTypeAndStatus = -1;
                break;
            case '(':
                if (BraceTypeAndStatus != 0)
                {
                    // a wrapper has already been opened
                    result = 0;
                    return false;
                }
                BraceTypeAndStatus = 3;
                break;
            case ')':
                if (BraceTypeAndStatus != 3)
                {
                    // fail: no leading '(' or another wrapper type was used
                    result = 0;
                    return false;
                }
                BraceTypeAndStatus = -3;
                break;
            case '"':
                if (BraceTypeAndStatus == 0)
                {
                    BraceTypeAndStatus = 4;   // opening quote
                }
                else if (BraceTypeAndStatus == 4)
                {
                    BraceTypeAndStatus = -4;  // closing quote
                }
                else
                {
                    // fail: a different wrapper type is in use
                    result = 0;
                    return false;
                }
                break;
            default:
                // fail: unexpected char found
                result = 0;
                return false;
        }

        // if we hit a closing brace/bracket/quote then only whitespace may remain
        if (BraceTypeAndStatus < 0)
        {
            // Start after the closing character itself; it is not whitespace.
            for (inputCurser++; inputCurser < input.Length; inputCurser++)
            {
                if (!char.IsWhiteSpace(input[inputCurser]))
                {
                    // only whitespace expected after closing brace
                    result = 0;
                    return false;
                }
            }
            break;
        }
    }

    // fail: a wrapper was opened but never closed
    if (BraceTypeAndStatus > 0)
    {
        result = 0;
        return false;
    }

    // check if no digits were found
    if (destLoc <= 1)
    {
        result = 0;
        return false;
    }

    // radixLocation is the distance from the MSB, it should be from the LSB. (or leave at 0 if radix point not found)
    if (radixLocation > 0)
    {
        radixLocation -= destLoc;
    }

    // hex are just bits of 4 so the scale is easy
    int newScale = (radixLocation * 4) + additionalScale;

    // Only the first destLoc characters were written; do not hand the unused tail to the parser.
    if (!BigInteger.TryParse(cleaned[..destLoc], NumberStyles.AllowHexSpecifier, null, out BigInteger asInt))
    {
        result = new BigFloat(0);
        return false;
    }

    if (isNeg)
    {
        asInt = BigInteger.Negate(asInt);
    }

    result = new BigFloat(asInt, newScale);
    return true;
}

/// <summary>
/// Converts the binary number in a string to a BigFloat.
/// If it fails, an exception is thrown.
/// e.g, '-11111100.101' would set the BigFloat to that rawValue, -252.625.
/// </summary>
/// <param name="input">The binary string input. It should be only [0,1,-,.]</param>
/// <param name="scale">(optional)Additional scale - can be positive or negative</param>
/// <param name="forceSign">(optional)Forces a sign on the output. [negative int = force negative, 0 = do nothing, positive int = force positive]</param>
/// <param name="includesHiddenBits">(optional)The number of bits that should be included in the sub-precision hidden-bits.</param>
/// <returns>A BigFloat result of the input binary string.</returns>
/// <exception cref="ArgumentException">Thrown when <paramref name="input"/> is null, empty, or cannot be converted.</exception>
public static BigFloat ParseBinary(string input, int scale = 0, int forceSign = 0, int includesHiddenBits = -1)
{
    ArgumentException.ThrowIfNullOrEmpty(input); // .Net 7 or later

    if (!TryParseBinary(input.AsSpan(), out BigFloat result, scale, forceSign, includesHiddenBits))
    {
        // The second constructor argument is the parameter NAME, not the offending value.
        throw new ArgumentException("Unable to convert the binary string to a BigFloat.", nameof(input));
    }

    return result;
}

/// <summary>
/// Converts the binary text in ReadOnlySpan&lt;char&gt; to a BigFloat.
/// e.g. '-11111100.101' would set the BigFloat to that rawValue, -252.625.
/// Commas, underscores and spaces are ignored; a single ':' or '|' marks where the hidden bits begin.
/// </summary>
/// <param name="input">The binary string input. It should be only [0,1,-,.]</param>
/// <param name="result">(out) The BigFloat result.</param>
/// <param name="scale">(optional)Additional scale - can be positive or negative</param>
/// <param name="forceSign">(optional)Forces a sign on the output. [negative int = force negative, 0 = do nothing, positive int = force positive]</param>
/// <param name="includesHiddenBits">(optional)The number of bits that should be included in the sub-precision hidden-bits.</param>
/// <returns>Returns false if it fails or is given an empty or null string.</returns>
public static bool TryParseBinary(ReadOnlySpan<char> input, out BigFloat result, int scale = 0, int forceSign = 0, int includesHiddenBits = -1)
{
    int inputLen = input.Length;

    if (inputLen == 0)
    {
        result = new BigFloat(0);
        return false;
    }

    byte[] bytes = new byte[(inputLen + 7) / 8];
    bool radixPointFound = false;
    int outputBitPosition = 0;   // The current bit we are writing to.

    // A leading '-' makes the value negative (unless forceSign overrides it below).
    bool isNeg = input[0] == '-';

    // if starting with a - or + then headPosition should be 1.
    int headPosition = (isNeg || input[0] == '+') ? 1 : 0;

    if (forceSign != 0)
    {
        isNeg = forceSign < 0;
    }

    int orgScale = scale;
    //                                01234567 89012345
    // Given the Input String:        00000001 00000010 00000011
    // Output Byte Array should be:      [2]1    [1]2    [0]3
    //
    // Now we are going to work our way from the end of the string forward.
    // We work backward to ensure the byte array is correctly aligned.
    int hiddenBitsFound = -1;
    for (int tailPosition = inputLen - 1; tailPosition >= headPosition; tailPosition--)
    {
        switch (input[tailPosition])
        {
            case '1':
                bytes[outputBitPosition >> 3] |= (byte)(1 << (outputBitPosition & 0x7));
                goto case '0';
            case '0':
                outputBitPosition++;
                if (!radixPointFound)
                {
                    // Every bit seen before the radix point (scanning from the right) is a fractional bit.
                    scale--;
                }
                break;
            case '.':
                // Let's make sure the decimal was not already found.
                if (radixPointFound)
                {
                    result = new BigFloat(0);
                    return false; // Function was not successful - duplicate '.'
                }
                radixPointFound = true;
                break;
            case ',' or '_' or ' ': // allow commas, underscores, and spaces (e.g. 1111_1111_0000) (optional - remove for better performance)
                break;
            case ':' or '|':
                if (hiddenBitsFound >= 0)
                {
                    // multiple precision spacers found (| or :)
                    result = new BigFloat(0);
                    return false;
                }
                hiddenBitsFound = outputBitPosition;
                break;
            default:
                result = new BigFloat(0);
                return false; // Function was not successful - unsupported char found
        }
    }

    if (outputBitPosition == 0)
    {
        result = new BigFloat(0);
        return false; // Function was not successful - no 0/1 bits found
    }

    // if the user specified a precision spacer (| or :)
    if (hiddenBitsFound >= 0)
    {
        // includesHiddenBits is specified? if so, they must match!
        if (includesHiddenBits >= 0)
        {
            // make sure they match and fail if they do not.
            if (hiddenBitsFound != includesHiddenBits)
            {
                result = new BigFloat(0);
                return false;
            }
        }
        else // includesHiddenBits NOT specified
        {
            includesHiddenBits = hiddenBitsFound;
        }
    }

    // Neither a spacer nor an explicit count: the input carries no hidden bits.
    if (includesHiddenBits < 0)
    {
        includesHiddenBits = 0;
    }

    // Build the magnitude as an unsigned value and negate afterwards. A hand-rolled two's complement
    // on 'bytes' goes wrong when the sign is forced and the bits fill the array exactly
    // (e.g. "11111111" with forceSign < 0), because no spare sign bit is left.
    BigInteger bi = new(bytes, isUnsigned: true);
    if (isNeg)
    {
        bi = -bi;
    }

    // Without a radix point the caller's scale is used as-is; with one, the counted fractional bits apply.
    result = new BigFloat(bi << (ExtraHiddenBits - includesHiddenBits), radixPointFound ? scale + includesHiddenBits : orgScale, true);

    result.AssertValid();

    return true; // return true if success
}

/// <summary>
/// Converts the binary text in ReadOnlySpan&lt;char&gt; to a BigInteger.
/// If it fails it returns false.
/// e.g '-11111100.101' would ignore the decimal and set the BigInteger to -252.
/// </summary>
/// <param name="input">The binary string input. It should be only [-/+, 0,1,' ', period,comma,_]</param>
/// <param name="result">(out) The BigInteger result.</param>
/// <returns>True is successful; False if it fails.</returns>
public static bool TryParseBinary(ReadOnlySpan<char> input, out BigInteger result)
{
    int inputLen = input.Length;

    if (inputLen == 0)
    {
        result = new BigInteger(0);
        return false;
    }

    byte[] bytes = new byte[(inputLen + 7) / 8];
    int outputBitPosition = 0;   // The current bit we are writing to.

    // A leading '-' makes the result negative.
    bool isNeg = input[0] == '-';

    // if starting with - or + then headPosition should be 1.
    int headPosition = (isNeg || input[0] == '+') ? 1 : 0;

    // Only the characters before the last '.' are read; the fractional part is ignored.
    int periodLoc = input.LastIndexOf('.');
    int tailPosition = (periodLoc < 0 ? inputLen : periodLoc) - 1;

    // Walk from the least-significant character toward the head so bit 0 lands in bytes[0].
    for (; tailPosition >= headPosition; tailPosition--)
    {
        switch (input[tailPosition])
        {
            case '1':
                bytes[outputBitPosition >> 3] |= (byte)(1 << (outputBitPosition & 0x7));
                goto case '0';
            case '0':
                outputBitPosition++;
                break;
            case ',' or '_' or ' ': // allow commas, underscores, and spaces (e.g. 1111_1111_0000) (optional - remove for better performance)
                break;
            default:
                result = new BigInteger(0);
                return false; // Function was not successful - unsupported char found
        }
    }

    // Read the collected bits as an unsigned magnitude, then apply the sign.
    BigInteger magnitude = new(bytes, isUnsigned: true);
    result = isNeg ? -magnitude : magnitude;

    // return true if success, if no 0/1 bits found then return false.
    return outputBitPosition != 0;
}

///////////////////////////////////////////////////////////////////////////////
/////////////////////////    [END] Parse FUNCTIONS [END]  /////////////////////
///////////////////////////////////////////////////////////////////////////////

///////////////////////////////////////////////////////////////////////////////
/////////////////////////    CompareTo  FUNCTIONS     /////////////////////////
///////////////////////////////////////////////////////////////////////////////

/// <summary>
/// Compares this instance with a boxed BigFloat or BigInteger by forwarding to the matching typed overload.
///   Returns negative => this instance is less than other
///   Returns Zero     => this instance is equal to other (Least significant bits are removed on more accurate number.)
///     i.e. Sub-Precision bits rounded and removed.
///     e.g. 1.11==1.1,  1.00==1.0,  1.11!=1.10)
///   Returns Positive => this instance is greater than other OR <paramref name="obj"/> is null.
/// </summary>
/// <exception cref="ArgumentException">Thrown when <paramref name="obj"/> is neither a BigFloat nor a BigInteger.</exception>
public int CompareTo(object obj) // for IComparable
{
    // If other is not a valid object reference, this instance is greater.
    if (obj is null)
    {
        return 1;
    }

    if (obj is BigFloat otherFloat)
    {
        return CompareTo(otherFloat);
    }

    if (obj is BigInteger otherInteger)
    {
        return CompareTo(otherInteger);
    }

    throw new ArgumentException("Object is not a BigFloat");
}

/// <summary>
/// Compares the in-precision bits between two values. Only the most significant bit in the HiddenBits is considered.
///   Returns negative => this instance is less than other
///   Returns Zero     => this instance is equal to other (Accuracy of higher number reduced
///     i.e. Sub-Precision bits rounded and removed.
///     e.g. 1.11==1.1,  1.00==1.0,  1.11!=1.10)
///   Returns Positive => this instance is greater than other
/// </summary>
public int CompareTo(BigFloat other)
{
    if (CheckForQuickCompareWithExponentOrSign(other, out int quickResult))
    {
        return quickResult;
    }

    // At this point, the exponent is equal or off by one because of a rollover.
    int sizeDiff = _size - other._size - Exponent + other.Exponent;

    // Both sides always drop the hidden bits; the side with the surplus drops sizeDiff more.
    int thisShift = ExtraHiddenBits;
    int otherShift = ExtraHiddenBits;
    if (sizeDiff > 0)
    {
        thisShift += sizeDiff;
    }
    else if (sizeDiff < 0)
    {
        otherShift -= sizeDiff;
    }

    BigInteger thisRounded = RightShiftWithRound(DataBits, thisShift);
    BigInteger otherRounded = RightShiftWithRound(other.DataBits, otherShift);

    return thisRounded.CompareTo(otherRounded);
}

/// <summary>
/// A more accurate version of CompareTo() however it is not compatible with IEquatable. Compares the two numbers by subtracting them and if they are less than 0|1000 (i.e. Zero) then they are considered equal.
/// e.g. Using 10|01111111 AND 10|10000000, CompareTo() returns not equal, but CompareInPrecisionBitsTo() returns Equal
///   Returns negative => this instance is less than other
///   Returns Zero     => this instance is equal to other. (or the difference is less than 0|1000 )
///     i.e. Sub-Precision bits rounded and removed.
///     e.g. 1.11 == 1.1,  1.00 == 1.0,  1.11 != 1.10
///   Returns Positive => this instance is greater than other
/// </summary>
public int CompareInPrecisionBitsTo(BigFloat other)
{
    if (CheckForQuickCompareWithExponentOrSign(other, out int result)) { return result; }

    // At this point, the exponent is equal or off by one because of a rollover.

    int sizeDiff = _size - other._size - Exponent + other.Exponent;

    // Shrink whichever side has the surplus bits (with rounding), then subtract.
    BigInteger diff = sizeDiff switch
    {
        //> 0 => -(other.DataBits - (DataBits >> (sizeDiff - expDifference))),    // slightly faster version
        > 0 => BigFloat.RightShiftWithRound(DataBits, sizeDiff) - other.DataBits, // slightly more precise version
        //< 0 => -((other.DataBits >> (expDifference - sizeDiff)) - DataBits),    // slightly faster version
        < 0 => DataBits - BigFloat.RightShiftWithRound(other.DataBits, -sizeDiff),// slightly more precise version
        0 => DataBits - other.DataBits
    };

    // a quick exit: more than 4 bytes => clearly different; fewer than 4 bytes => treated as equal.
    // NOTE(review): the literal 4 presumably corresponds to ExtraHiddenBits being 32 - confirm.
    int bytes = diff.GetByteCount();
    if (bytes != 4)
    {
        return (bytes > 4) ? diff.Sign : 0;
    }

    // Since we are subtracting, we can run into an issue where a 0:100000 should be considered a match.  e.g. 11:000 == 10:100
    diff -= diff.Sign; // decrements towards 0

    // Future: need to benchmark A, B or C
    //int a = RightShiftWithRound(temp, ExtraHiddenBits).Sign;
    //int b = (BigInteger.Abs(temp) >> (ExtraHiddenBits - 1)).IsZero ? 0 : temp.Sign;
    // Equal (0) when the magnitude of the difference needs fewer than ExtraHiddenBits bits.
    int c = ((int)((diff.Sign >= 0) ? diff : -diff).GetBitLength() < ExtraHiddenBits) ? 0 : diff.Sign;

    return c;
}

// Tries to decide a comparison from the OutOfPrecision flags, the signs and the exponents alone.
// Returns true with the answer in 'result' when that was enough; returns false (with result = 0)
// when the caller still has to compare the actual bits.
private bool CheckForQuickCompareWithExponentOrSign(BigFloat other, out int result)
{
    // When this value is out of precision, only the other value's sign (if it is in precision) matters.
    if (OutOfPrecision)
    {
        result = other.OutOfPrecision ? 0 : -other.DataBits.Sign;
        return true;
    }

    // Reaching here means OutOfPrecision was false, so this yields DataBits.Sign.
    if (other.OutOfPrecision)
    {
        result = OutOfPrecision ? 0 : DataBits.Sign;
        return true;
    }

    // Lets see if we can escape early by just looking at the Sign.
    if (DataBits.Sign != other.DataBits.Sign)
    {
        result = DataBits.Sign;
        return true;
    }

    // Lets see if we can escape early by just looking at the Exponent.
    int expDifference = Exponent - other.Exponent;
    if (Math.Abs(expDifference) > 1)
    {
        // The sign flips the ordering for negative values.
        result = Exponent.CompareTo(other.Exponent) * DataBits.Sign;
        return true;
    }

    // At this point, the sign is the same, and the exp are within 1 bit of each other.

    //There are three special cases when the Exponent is off by just 1 bit:
    // case 1:  The smaller of the two rounds up to match the size of the larger and, therefore, can be equal(11 | 111 == 100 | 000)
    // case 2:  The smaller of the two rounds up, but the larger one also rounds up, so they are again not equal(depends on #1 happening first)
    // case 3:  Both round-up and are, therefore, equal

    //If "this" is larger by one bit AND "this" is not in the format 10000000..., THEN "this" must be larger(or smaller if neg)
    if (expDifference == 1 && !IsOneBitFollowedByZeroBits)
    {
        result = DataBits.Sign;
        return true;
    }

    // If "other" is larger by one bit AND "other" is not in the format 10000000..., THEN "other" must be larger(or smaller if neg)
    // NOTE(review): this branch uses Sign while the others use DataBits.Sign - confirm they agree here.
    if (expDifference == -1 && !other.IsOneBitFollowedByZeroBits)
    {
        result = -Sign;
        return true;
    }

    result = 0;
    return false;
}

/// <summary>
/// Compares two values(including the hidden precision bits) and returns:
///   Returns -1 when this instance is less than <paramref name="other"/>
///   Returns  0 when this instance is equal to <paramref name="other"/>
///   Returns +1 when this instance is greater than <paramref name="other"/>
/// An Equals(Zero) generally should be avoided as missing accuracy in the less accurate number has 0 appended. And these values would need to match exactly.
/// No rounding is performed by this comparison.
/// </summary>
public int CompareToExact(BigFloat other)
{
    int thisPos = DataBits.Sign;
    int otherPos = other.DataBits.Sign;

    // Let's first make sure the signs are the same, if not, the positive input is greater.
    if (thisPos != otherPos)
    {
        //  OTHER-> -1  0  1
        //       -1| X -1 -1
        //  THIS: 0| 1  X -1  <-Return
        //        1| 1  1  X
        return thisPos == 0 ? -otherPos : thisPos;
    }

    // At this point the signs are the same.

    // if both are zero then they are equal
    if (thisPos == 0)
    {
        return 0;
    }

    // A fast general size check. (aka. Exponent vs Exponent)
    // This compares magnitudes, so the answer flips for negative numbers.
    int thisTop = Scale + _size;
    int otherTop = other.Scale + other._size;
    if (thisTop != otherTop)
    {
        return Math.Sign(thisTop.CompareTo(otherTop)) * thisPos;
    }

    // Both values have the same exponent. Append zeros to the shorter one so the two line up
    // bit-for-bit. BigInteger.CompareTo is already a signed comparison, so its result must not
    // be multiplied by the sign again.
    int sizeDiff = _size - other._size;
    int comparison = sizeDiff switch
    {
        > 0 => DataBits.CompareTo(other.DataBits << sizeDiff),    // other is shorter - grow other
        < 0 => (DataBits << -sizeDiff).CompareTo(other.DataBits), // this is shorter - grow this
        _ => DataBits.CompareTo(other.DataBits)
    };

    return Math.Sign(comparison);
}

/// <summary>
/// Compares two values ignoring the least number of significant bits specified.
/// e.g. CompareToIgnoringLeastSigBits(0b1001.1111, 0b1000.111101, 3) => (b1001.11, 0b1001.0)
/// Valid ranges are from -ExtraHiddenBits and up.
///   Returns -1 when <paramref name="a"/> is less than <paramref name="b"/>
///   Returns  0 when <paramref name="a"/> is equal to <paramref name="b"/> when ignoring the least significant bits.
///   Returns  1 when <paramref name="a"/> is greater than <paramref name="b"/>
/// </summary>
/// <exception cref="ArgumentOutOfRangeException">Thrown when <paramref name="leastSignificantBitsToIgnore"/> is below -ExtraHiddenBits.</exception>
public static int CompareToIgnoringLeastSigBits(BigFloat a, BigFloat b, int leastSignificantBitsToIgnore)
{
    // The hidden bits are always part of what gets ignored.
    leastSignificantBitsToIgnore += ExtraHiddenBits;

    if (leastSignificantBitsToIgnore < 0)
    {
        throw new ArgumentOutOfRangeException(nameof(leastSignificantBitsToIgnore),
            $"Param cannot be less then -ExtraHiddenBits({-ExtraHiddenBits}).");
    }

    // Bring both values to the coarser scale before subtracting.
    int scaleDiff = b.Scale - a.Scale;
    BigInteger delta;
    if (scaleDiff > 0)
    {
        delta = (a.DataBits >> scaleDiff) - b.DataBits;   // 'a' has more accuracy
    }
    else if (scaleDiff < 0)
    {
        delta = a.DataBits - (b.DataBits >> -scaleDiff);  // 'b' has more accuracy
    }
    else
    {
        delta = a.DataBits - b.DataBits;
    }

    // since we are subtracting, we can run into an issue where a 0:100000 should be considered a match.  e.g. 11:000 == 10:100
    delta -= delta.Sign; //decrements towards 0

    // The values differ only if the remaining difference reaches above the ignored bits.
    bool differsAboveIgnoredBits = BigInteger.Abs(delta).GetBitLength() > (leastSignificantBitsToIgnore - 1);
    return differsAboveIgnoredBits ? delta.Sign : 0;
}

/// <summary>
/// Compares this instance with a BigInteger.
///   Returns a negative value when this instance is less than the other
///   Returns 0 when this instance is equal to the other
///   Returns a positive value when this instance is greater than the other
/// The hidden bits are removed (with rounding) before the final comparison.
/// </summary>
public int CompareTo(BigInteger bigInteger)
{
    int thisSign = DataBits.Sign;
    int otherSign = bigInteger.Sign;

    // This is zero: the answer is the opposite of the other's sign (0 when both are zero).
    if (thisSign == 0)
    {
        return -otherSign;
    }

    // A fast sign check.
    if (thisSign != otherSign)
    {
        return thisSign;
    }

    // A fast general size check. Larger magnitude wins, flipped for negatives.
    int bigIntegerSize = (int)BigInteger.Abs(bigInteger).GetBitLength();
    if (Exponent != bigIntegerSize)
    {
        return Exponent.CompareTo(bigIntegerSize) * thisSign;
    }

    // Same sign and same bit length: round to an integer and compare the values directly.
    BigInteger thisAsInteger = RightShiftWithRound(DataBits, ExtraHiddenBits - Scale);
    return thisAsInteger.CompareTo(bigInteger);
}

///////////////////////////////////////////////////////////////////////////////
//////////////////////  [END] CompareTo  FUNCTIONS [END] //////////////////////
///////////////////////////////////////////////////////////////////////////////

/// <summary>
/// Checks to see if the value is an integer. Returns true if all the bits between the radix point and the middle of ExtraHiddenBits are all 0 or all 1.
///   for scale &lt;= 0, if all bits are 0 or 1 between radix and half-way through the ExtraHiddenBits
///   for scale &gt;= (ExtraHiddenBits/2), is always true.
///
/// if we call it an integer then it should follow that ...
///   it should not round up based on ExtraHiddenBits
///   Ceiling would round up (and Floor down for negative)
/// </summary>
public bool IsInteger  //v3 - just checks bits between radix and middle of hidden bits
{
    get
    {
        int windowStart = ExtraHiddenBits >> 1;     // middle of the hidden bits
        int windowEnd = ExtraHiddenBits - Scale;    // position of the radix point

        if (windowStart <= Scale || windowStart >= windowEnd)
        {
            return true; // technically inconclusive though.
        }

        // Isolate the bits in [windowStart, windowEnd) and see whether they are uniform.
        int windowWidth = windowEnd - windowStart;
        BigInteger allOnes = (BigInteger.One << windowWidth) - 1;
        BigInteger window = (DataBits >> windowStart) & allOnes;

        return window.IsZero || window == allOnes;
    }
}

/// <summary>
/// Tests to see if the number is in the format of "10000000..." after rounding.
/// </summary>
// All but the top hidden bit are shifted away; the value matches when the trailing-zero count
// of what remains equals the number of in-precision bits (_size - ExtraHiddenBits).
public bool IsOneBitFollowedByZeroBits => BigInteger.TrailingZeroCount(DataBits >> (ExtraHiddenBits - 1)) == (_size - ExtraHiddenBits);

/// <summary>
/// Returns the lowest 64 bits of DataBits (hidden bits included). For negative values the masked
/// bits are complemented and adjusted as shown in the getter.
/// </summary>
public ulong Lowest64BitsWithHiddenBits
{
    get
    {
        ulong raw = (ulong)(DataBits & ulong.MaxValue);

        if (DataBits.Sign < 0)
        {
            // NOTE(review): if _size is an int, C# masks the shift count to its low 5 bits, so
            // "_size >> 64" evaluates as "_size >> 0" and this adds 1 whenever _size > 0 - confirm
            // that is the intent.
            raw = ~raw + (ulong)(((_size >> 64) > 0) ? 1 : 0);
        }
        return raw;
    }
}

/// <summary>
/// Returns the lowest 64 bits of DataBits after the hidden bits have been shifted away.
/// Negative values are handled separately from non-negative ones, as shown in the getter.
/// </summary>
public ulong Lowest64Bits
{
    get
    {
        if (DataBits.Sign >= 0)
        {
            // Non-negative: drop the hidden bits and keep the low 64 bits.
            ulong raw = (ulong)((DataBits >> ExtraHiddenBits) & ulong.MaxValue);
            return raw;
        }
        else if (_size >= ExtraHiddenBits)
        {
            // Negative with in-precision bits: subtract one, shift, mask, then complement.
            return ~(ulong)(((DataBits - 1) >> ExtraHiddenBits) & ulong.MaxValue);
            //return (ulong)((BigInteger.Abs(_int) >> ExtraHiddenBits) & ulong.MaxValue); //perf: benchmark
        }
        else
        {
            // Negative and smaller than the hidden-bit region: shift, mask, then complement.
            ulong raw = (ulong)((DataBits >> ExtraHiddenBits) & ulong.MaxValue);
            //raw--;
            raw = ~raw;
            return raw;
        }
    }
}

/// <summary>
/// Returns the 64 most significant data bits. If the number is negative the sign is ignored. If the size is smaller than 64 bits, then the LSBs are padded with zeros.
/// </summary>
public ulong Highest64Bits
{
    get
    {
        BigInteger magnitude = BigInteger.Abs(DataBits);

        // A negative shift count (size below 64) shifts left, which supplies the zero padding.
        return (ulong)(magnitude >> (_size - 64));
    }
}

/// <summary>
/// Returns the 128 most significant data bits. If the number is negative the sign is ignored. If the size is smaller than 128 bits, then the LSBs are padded with zeros.
/// </summary>
public UInt128 Highest128Bits
{
    get
    {
        BigInteger magnitude = BigInteger.Abs(DataBits);

        // A negative shift count (size below 128) shifts left, which supplies the zero padding.
        return (UInt128)(magnitude >> (_size - 128));
    }
}

/// <summary>
/// Rounds to the next integer towards negative infinity. Any fractional bits are removed, negative scales are set
/// to zero, and the precision(size) will be resized to just the integer part.
/// </summary>
/// <returns>The floored value; this instance is returned unchanged when there are no fractional bits to clear.</returns>
public BigFloat Floor()
{
    int bitsToClear = ExtraHiddenBits - Scale; // number of bits to clear from DataBits

    // 'Scale' will be zero or positive. (since all fraction bits are stripped away)
    // 'Size'  will be the size of the new integer part.
    // Precision of the decimal bits are stripped away.

    // If bitsToClear <= 0, then all fraction bits are implicitly zero and nothing needs to be done.
    //   Example: Scale = 32+7, int=45, size=6+32=38 -> bitsToClear=-7   -101101[10101010010...00010]0000000.
    if (bitsToClear <= 0)
    {
        return this;
    }

    // If the magnitude is below one, we can just return 0 for positive numbers and -1 for negative.
    //   Example: Scale = -11, int=45, size=6+32=38  -> bitsToClear=32+11   -.00000 101101[10101010010...00010]
    if (bitsToClear >= _size)
    {
        return DataBits.Sign >= 0 ? new BigFloat(0, 0, 0) : new BigFloat(BigInteger.MinusOne << ExtraHiddenBits, 0, 1 + ExtraHiddenBits);
    }

    // If Scale is between -size and 0..
    //   Example: Scale = -4, int=45, size=6+32=38  -> bitsToClear=32+4   10.1101[10101010010...00010]  ->   10.[00000000000...00000]
    //   Example: Scale = -4, int=45, size=6+32=38  -> bitsToClear=32+4  -11.1101[10101010010...00010]  -> -100.[00000000000...00000]
    // BigInteger's right shift is arithmetic (rounds toward negative infinity), so the same
    // expression floors both positive and negative values.
    if (Scale < 0)
    {
        return new BigFloat(DataBits >> bitsToClear);
    }

    // Scale is between 0 and ExtraHiddenBits: the radix point is inside the hidden bits.
    //   Example: Scale = 4, int=45, size=6+32=38  -> bitsToClear=32-4   101101[1010.1010010...00010]  ->   101101[1010.0000000...00000]
    //   Example: Scale = 4, int=45, size=6+32=38  -> bitsToClear=32-4  -101101[1010.1010010...00010]  ->  -101101[1011.0000000...00000]
    // Shifting down and back up clears the fractional bits; for negative values the arithmetic
    // shift already moved the value toward negative infinity, so no extra adjustment is needed.
    BigInteger floored = (DataBits >> bitsToClear) << bitsToClear;

    if (DataBits.Sign > 0 || floored == DataBits)
    {
        // Flooring a positive value, or a value with no fractional bits, never changes the size.
        return new BigFloat(floored, Scale, _size);
    }

    // If Negative and Flooring, and the abs(result) is a PowerOfTwo the size will grow by 1.  -1111.1 -> -10000, -10000 -> -10000
    // Measure the magnitude: GetBitLength() on a negative power of two reports one bit fewer.
    int newSize = (int)BigInteger.Abs(floored).GetBitLength();
    return new BigFloat(floored, Scale, newSize);
}

/// <summary>
/// Rounds to the next integer towards positive infinity. Any fractional bits are removed, negative scales are set
/// to zero, and the precision(size) will be resized to just the integer part.
/// </summary>
public BigFloat Ceiling()
{
    // Number of low-order bits of DataBits that lie below the radix point (i.e. the fractional bits).
    int bitsToClear = ExtraHiddenBits - Scale;

    // If bitsToClear <= 0 (Scale >= ExtraHiddenBits), all fraction bits are implicitly zero; nothing to do.
    //   Example: Scale = 32+7, int=45, size=6+32=38 -> bitsToClear=-7   -101101[10101010010...00010]0000000.
    if (bitsToClear <= 0)
    {
        return this;
    }

    // Every stored bit is fractional: return 1 for positive values and 0 for zero/negative values.
    //   Example: Scale = -11, int=45, size=6+32=38 -> bitsToClear=32+11   -.00000 101101[10101010010...00010]
    if (bitsToClear >= _size)
    {
        return DataBits.Sign <= 0
            ? new BigFloat(0, 0, 0)
            : new BigFloat(BigInteger.One << ExtraHiddenBits, 0, 1 + ExtraHiddenBits);
    }

    // From here on bitsToClear > 0, i.e. Scale < ExtraHiddenBits always holds.

    if (DataBits.Sign > 0)
    {
        // If positive and Ceiling, a round-up can carry into a new top bit (1111.1 -> 10000),
        // so the size is re-measured whenever a round-up happens.
        if (Scale >= 0) // Scale is between 0 and ExtraHiddenBits
        {
            // Example: Scale = 4, int=45, size=6+32=38 -> bitsToClear=32-4
            //          101101[1010.1010010...00010] -> 101101[1011.0000000...00000]
            // BigInteger.One is used for the shifts: an int "1 << bitsToClear" wraps when
            // bitsToClear is 32 (Scale == 0), which silently disabled the round-up.
            BigInteger fractionMask = (BigInteger.One << bitsToClear) - 1;
            bool roundsUp = !(DataBits & fractionMask).IsZero;

            BigInteger intPart = (DataBits >> bitsToClear) << bitsToClear;
            int newSize = _size;
            if (roundsUp)
            {
                intPart += BigInteger.One << bitsToClear;
                newSize = (int)intPart.GetBitLength(); //future: maybe slow (maybe use BigInteger.TrailingZeroCount to detect rollover)
            }

            return new BigFloat(intPart, Scale, newSize);
        }
        else // Scale is between -size and 0
        {
            // Example: Scale = -4, int=45, size=6+32=38 -> bitsToClear=32+4
            //          10.1101[10101010010...00010] -> 11.[00000000000...00000]
            // Round up if any bits are set between (ExtraHiddenBits/2) and (ExtraHiddenBits-Scale);
            // the bottom half of the hidden bits is not considered.
            int halfHidden = ExtraHiddenBits / 2;
            bool roundsUp = (DataBits & (((BigInteger.One << (halfHidden - Scale)) - 1) << halfHidden)) > 0;

            BigInteger intPart = DataBits >> bitsToClear << ExtraHiddenBits;
            if (roundsUp)
            {
                intPart += BigInteger.One << ExtraHiddenBits;
            }

            int newSize = roundsUp
                ? (int)intPart.GetBitLength() //future: maybe slow (maybe use BigInteger.TrailingZeroCount to detect rollover)
                : _size - bitsToClear + ExtraHiddenBits;

            return new BigFloat(intPart, 0, newSize);
        }
    }

    // Negative values: the ceiling is a truncation toward zero, so the size always remains the same.
    if (Scale >= 0) // Scale is between 0 and ExtraHiddenBits
    {
        // Example: Scale = 4, int=45, size=6+32=38 -> bitsToClear=32-4
        //          -101101[1010.1010010...00010] -> -101101[1010.0000000...00000]
        // BigInteger's >> is an arithmetic shift (it floors negative values), so the fractional
        // bits are cleared on the magnitude and the sign is restored afterwards.
        BigInteger truncated = -(((-DataBits) >> bitsToClear) << bitsToClear);
        return new BigFloat(truncated, Scale, _size);
    }

    // Scale is between -size and 0: the arithmetic shift floors, so step up by one unless the
    // value already is an integer.
    BigInteger ceilingInt = DataBits >> bitsToClear;
    if (!IsInteger)
    {
        ceilingInt++;
    }

    return new BigFloat(ceilingInt);
}

/// <summary>
/// Returns the number of matching leading bits with rounding.
///   i.e. The largest number of leading bits that when rounded, become equal.
///   i.e. The difference in their Log2 values.
///   i.e. size - BitSize(abs(a-b))
///   e.g. 10.111 - 10.101 is 00.010 so returns 4
///
/// The Exponent(or Scale + _size) is considered.
///   e.g. 100. and 1000. would return 0
///
/// If the signs do not match then 0 is returned.
///
/// When a rollover is near these bits are included.
///   e.g. 11110 and 100000 returns 3
///
/// HiddenBits are included.
/// </summary>
/// <param name="a">The first BigFloat to compare to.</param>
/// <param name="b">The second BigFloat to compare to.</param>
/// <param name="sign">(out) Returns the sign of a-b. Example: If a is larger the sign is set to 1.</param>
public static int NumberOfMatchingLeadingBitsWithRounding(BigFloat a, BigFloat b, out int sign)
{
    // With at most a 1-bit exponent difference we could have...
    //   11111111/100000000 that would have difference b1      so 7 matching bits
    //   11110000/100000000 that would have difference b10000  so 3 matching bits
    //  -11110000/100000000 that would have difference b10000  so 0 matching bits
    int largerSize = Math.Max(a._size, b._size);
    int exponentGap = a.Exponent - b.Exponent;

    bool comparable = largerSize != 0 && a.Sign == b.Sign && Math.Abs(exponentGap) <= 1;
    if (!comparable)
    {
        sign = exponentGap > 0 ? a.Sign : -b.Sign;
        return 0;
    }

    // Bring both operands to a common scale before subtracting.
    // (A negative shift count on BigInteger shifts in the opposite direction.)
    int scaleGap = a.Scale - b.Scale;
    BigInteger delta;
    if (scaleGap < 0)
    {
        delta = a.DataBits - (b.DataBits << scaleGap);
    }
    else
    {
        delta = (a.DataBits >> scaleGap) - b.DataBits;
    }

    sign = delta.Sign;
    int deltaLog2 = (int)BigInteger.Log2(BigInteger.Abs(delta));
    return largerSize - deltaLog2 - 1;
}

/// <summary>
/// Returns the number of matching leading bits that exactly match. HiddenBits are included.
///   i.e. The number of leading bits that exactly match.
///   e.g. 11010 and 11111 returns 2
///   e.g. 100000 and 111111 returns 1
/// If the signs do not match then 0 is returned.
///
/// The scale and precision(size) is ignored.
///   e.g. 11101000000 and 11111 returns 3
/// </summary>
/// <param name="a">The first BigFloat to compare to.</param>
/// <param name="b">The second BigFloat to compare to.</param>
public static int NumberOfMatchingLeadingBits(BigFloat a, BigFloat b)
{
    if (a.Sign != b.Sign)
    {
        return 0;
    }

    // Only the bits both operands actually have can match.
    int sharedSize = Math.Min(a._size, b._size);
    if (sharedSize == 0)
    {
        return 0;
    }

    // Align the most significant bits by shrinking the longer operand, then subtract.
    // (A negative shift count on BigInteger shifts in the opposite direction.)
    int sizeGap = a._size - b._size;
    BigInteger delta;
    if (sizeGap < 0)
    {
        delta = a.DataBits - (b.DataBits << sizeGap);
    }
    else
    {
        delta = (a.DataBits >> sizeGap) - b.DataBits;
    }

    int deltaLog2 = (int)BigInteger.Log2(BigInteger.Abs(delta));
    return sharedSize - deltaLog2 - 1;
}

//////////////////////////////////////////////////////////////////
/////////////////////// Operator Overloads ///////////////////////
//////////////////////////////////////////////////////////////////

/////////// Operator Overloads: BigFloat <--> BigFloat ///////////

/// <summary>Returns true if the left side BigFloat is equal to the right side BigFloat (i.e. CompareTo reports 0).</summary>
public static bool operator ==(BigFloat left, BigFloat right) => left.CompareTo(right) == 0;

/// <summary>Returns true if the left side BigFloat is not equal to the right BigFloat.</summary>
public static bool operator !=(BigFloat left, BigFloat right) => right.CompareTo(left) != 0;

/// <summary>Returns true if the left side BigFloat compares as less than the right side BigFloat.</summary>
public static bool operator <(BigFloat left, BigFloat right) => left.CompareTo(right) < 0;

/// <summary>Returns true if the left side BigFloat compares as greater than the right side BigFloat.</summary>
public static bool operator >(BigFloat left, BigFloat right) => left.CompareTo(right) > 0;

/// <summary>Returns true if the left side BigFloat compares as less than or equal to the right side BigFloat.</summary>
public static bool operator <=(BigFloat left, BigFloat right) => left.CompareTo(right) <= 0;

/// <summary>Returns true if the left side BigFloat compares as greater than or equal to the right side BigFloat.</summary>
public static bool operator >=(BigFloat left, BigFloat right) => left.CompareTo(right) >= 0;

/////////// Operator Overloads: BigFloat <--> BigInteger ///////////

/// <summary>Returns true if the left side BigFloat is equal to the right side BigInteger. If the BigFloat is not an integer then always returns false.</summary>
public static bool operator ==(BigFloat left, BigInteger right)
    => left.IsInteger && new BigFloat(right).CompareTo(left) == 0;

/// <summary>Returns true if the left side BigInteger is equal to the right side BigFloat. If the BigFloat is not an integer then always returns false.</summary>
public static bool operator ==(BigInteger left, BigFloat right)
    => right.IsInteger && new BigFloat(left).CompareTo(right) == 0;

/// <summary>Returns true if the left side BigFloat is not equal to the right side BigInteger. If the BigFloat is not an integer then always returns true.</summary>
public static bool operator !=(BigFloat left, BigInteger right)
    => !left.IsInteger || new BigFloat(right).CompareTo(left) != 0;

/// <summary>Returns true if the left side BigInteger is not equal to the right side BigFloat. If the BigFloat is not an integer then always returns true.</summary>
public static bool operator !=(BigInteger left, BigFloat right)
    => !right.IsInteger || new BigFloat(left).CompareTo(right) != 0;

/////////// Operator Overloads: BigFloat <--> ulong/long ///////////

/// <summary>Returns true if the left side BigFloat is equal to the right side unsigned long.</summary>
public static bool operator ==(BigFloat left, ulong right) => new BigFloat(right).CompareTo(left) == 0;

/// <summary>Returns true if the left side BigFloat is equal to the right side long.</summary>
public static bool operator ==(BigFloat left, long right) => new BigFloat(right).CompareTo(left) == 0;

/// <summary>Returns true if the left side long is equal to the right side BigFloat.</summary>
public static bool operator ==(long left, BigFloat right) => new BigFloat(left).CompareTo(right) == 0;

/// <summary>Returns true if the left side unsigned long is equal to the right side BigFloat.</summary>
public static bool operator ==(ulong left, BigFloat right) => new BigFloat(left).CompareTo(right) == 0;

/// <summary>Returns true if the left side BigFloat is not equal to the right side unsigned long.</summary>
public static bool operator !=(BigFloat left, ulong right) => new BigFloat(right).CompareTo(left) != 0;

/// <summary>Returns true if the left side unsigned long is not equal to the right side BigFloat.</summary>
public static bool operator !=(ulong left, BigFloat right) => new BigFloat(left).CompareTo(right) != 0;

/// <summary>Returns true if the left side BigFloat is not equal to the right side long.</summary>
public static bool operator !=(BigFloat left, long right) => new BigFloat(right).CompareTo(left) != 0;

/// <summary>Returns true if the left side long is not equal to the right side BigFloat.</summary>
public static bool operator !=(long left, BigFloat right) => new BigFloat(left).CompareTo(right) != 0;

// ---- less than: the integer operand is converted to a BigFloat and compared with CompareTo ----

public static bool operator <(long left, BigFloat right) => new BigFloat(left).CompareTo(right) < 0;

public static bool operator <(BigFloat left, long right) => left.CompareTo(new BigFloat(right)) < 0;

public static bool operator <(BigFloat left, ulong right) => left.CompareTo(new BigFloat(right)) < 0;

public static bool operator <(ulong left, BigFloat right) => new BigFloat(left).CompareTo(right) < 0;

// ---- greater than ----

public static bool operator >(BigFloat left, long right) => left.CompareTo(new BigFloat(right)) > 0;

public static bool operator >(BigFloat left, ulong right) => left.CompareTo(new BigFloat(right)) > 0;

public static bool operator >(ulong left, BigFloat right) => new BigFloat(left).CompareTo(right) > 0;

public static bool operator >(long left, BigFloat right) => new BigFloat(left).CompareTo(right) > 0;

// ---- less than or equal ----

public static bool operator <=(BigFloat left, long right) => left.CompareTo(new BigFloat(right)) <= 0;

public static bool operator <=(long left, BigFloat right) => new BigFloat(left).CompareTo(right) <= 0;

public static bool operator <=(ulong left, BigFloat right) => new BigFloat(left).CompareTo(right) <= 0;

public static bool operator <=(BigFloat left, ulong right) => left.CompareTo(new BigFloat(right)) <= 0;

// ---- greater than or equal ----

public static bool operator >=(long left, BigFloat right) => new BigFloat(left).CompareTo(right) >= 0;

public static bool operator >=(BigFloat left, long right) => left.CompareTo(new BigFloat(right)) >= 0;

public static bool operator >=(BigFloat left, ulong right) => left.CompareTo(new BigFloat(right)) >= 0;

public static bool operator >=(ulong left, BigFloat right) => new BigFloat(left).CompareTo(right) >= 0;

/// <summary>
/// Performs a modulus operation. For negative numbers there are two approaches, a math and programmers version.
/// For negative numbers this version uses the programmers version (it forwards to Remainder).
/// see: https://github.com/microsoft/calculator/issues/111
/// </summary>
public static BigFloat operator %(BigFloat dividend, BigFloat divisor) => Remainder(dividend, divisor);

// Anonymous 1/22/2021 at 9:06 AM https://www.java67.com/2014/11/modulo-or-remainder-operator-in-java.html :
//   Technically (n % m) is a remainder operator, but not a modulus operator. There's a difference.
//   For nonnegative n and positive m, the remainder and modulus are the same thing. But for negative n, they are
//   different. -2 mod 10 is defined to be 8 in standard mathematics, going back centuries. But the remainder
//   of -2 over 10 is -2. So (-2 % 10) gives -2, which is the remainder. It doesn't give 8, which is the mod.
//
//   If you ever need an actual mod operator, then (((n % m) + m) % m) gives the mod. In most cases where you have a
//   negative n, you'll actually need to find the mod rather than the remainder. So it's unfortunate Java doesn't
//   have a mod operator built in. It inherited this from C.
//
//   I wish C had defined % to be remainder and %% to be mod. That would have allowed us to avoid having to use ugly
//   constructions like (((n % m) + m) % m) when we need the mod.
//   Some languages actually do have both. For example, LISP has both "mod" and "rem" as operators. So does Ada. But
//   sadly, C and all its descendants have only rem, not mod.
//
// Also nice video on negatives: https://www.youtube.com/watch?v=AbGVbgQre7I
// More notes here on windows calculator: https://github.com/microsoft/calculator/issues/111

/// <summary>
/// Performs a Remainder operation (the "programmers" version of %).
/// The operand with the larger scale is shifted up so both share a scale, BigInteger's % is applied to the
/// data bits, and the result is shifted back.
/// For positive values, Modulus is identical to Remainder, for negatives, Modulus and Remainder differ.
/// The remainder is slightly faster.
/// </summary>
/// <param name="dividend">The value to be divided.</param>
/// <param name="divisor">The value to divide by.</param>
// see BifFloatModuloNotes.txt for additional notes
public static BigFloat Remainder(BigFloat dividend, BigFloat divisor)
{
    int scaleDiff = dividend.Scale - divisor.Scale;

    if (scaleDiff > 0)
    {
        // Dividend has the larger scale: widen it, take the remainder, then narrow the result again.
        BigInteger widened = dividend.DataBits << scaleDiff;
        return new BigFloat((widened % divisor.DataBits) >> scaleDiff, dividend.Scale, true);
    }

    if (scaleDiff < 0)
    {
        // Divisor has the larger scale. scaleDiff is negative here, so ">> scaleDiff" shifts UP
        // and "<< scaleDiff" shifts DOWN (BigInteger reverses direction for negative counts).
        BigInteger widened = divisor.DataBits >> scaleDiff;
        return new BigFloat((dividend.DataBits % widened) << scaleDiff, divisor.Scale, true);
    }

    // Same scale: the data bits can be used directly.
    return new BigFloat(dividend.DataBits % divisor.DataBits, divisor.Scale, true);

    // An alternative that shifts the operand with the smaller scale down (instead of shifting the
    // other operand up) was tried and found to be less accurate.
}

/// <summary>
/// Performs a Modulus operation.
/// For positive values, Modulus is identical to Remainder, for negatives, Modulus and Remainder differ.
/// The remainder is slightly faster.
/// </summary>
/// <param name="dividend">The value to be divided.</param>
/// <param name="divisor">The value to divide by.</param>
/// <returns>
/// Remainder(dividend, divisor), shifted by one divisor when the dividend is negative and the divisor is
/// positive, or when the dividend is non-negative and the divisor is not positive. An exactly-zero remainder
/// is returned unchanged.
/// </returns>
// see BifFloatModuloNotes.txt for additional notes
public static BigFloat Mod(BigFloat dividend, BigFloat divisor)
{
    BigFloat remainder = Remainder(dividend, divisor);

    // An exact multiple has modulus 0. Without this check the sign test below would add the
    // divisor anyway, e.g. Mod(-10, 5) produced 5 instead of 0.
    if (remainder.DataBits.IsZero)
    {
        return remainder;
    }

    return remainder + ((dividend < 0) ^ (divisor > 0) ? 0 : divisor);
}

/// <summary>
/// Bitwise Complement Operator - Reverses each bit in the data bits. Scale is not changed.
/// The size is reduced by at least 1 bit. This is because the leading bit is flipped to a zero.
/// </summary>
public static BigFloat operator ~(BigFloat value)
{
    // A run of value._size one-bits; XOR-ing with it flips exactly the bits covered by the size.
    BigInteger allOnes = (BigInteger.One << value._size) - 1;
    BigInteger flipped = value.DataBits ^ allOnes;
    return new BigFloat(flipped, value.Scale, true);
}

//future: add logic operations
//public static BigFloat operator &(BigFloat left, BigInteger right);
//public static BigFloat operator |(BigFloat left, BigInteger right);
//public static BigFloat operator ^(BigFloat left, BigInteger right);

/// <summary>
/// Left shift - Increases the size by adding least-significant zero bits.
/// i.e. The precision is enhanced.
/// No rounding is performed. Scale is passed through unchanged.
/// </summary>
/// <param name="x">The value the shift should be applied to.</param>
/// <param name="shift">The number of bits to shift left.</param>
/// <returns>A new BigFloat with the internal 'int' up shifted.</returns>
public static BigFloat operator <<(BigFloat x, int shift)
{
    BigInteger shiftedBits = x.DataBits << shift;
    int grownSize = x._size + shift;
    return new BigFloat(shiftedBits, x.Scale, grownSize);
}

/// <summary>
/// Right shift - Decreases the size by removing the least-significant bits.
/// i.e. The precision is reduced.
/// No rounding is performed. Scale is unaffected.
/// </summary>
/// <param name="x">The value the shift should be applied to.</param>
/// <param name="shift">The number of bits to shift right.</param>
/// <returns>A new BigFloat with the internal 'int' down shifted.</returns>
public static BigFloat operator >>(BigFloat x, int shift)
{
    return new(x.DataBits >> shift, x.Scale, x._size - shift);
}

/// <summary>Unary plus; returns the operand unchanged.</summary>
public static BigFloat operator +(BigFloat r)
{
    return r;
}

/// <summary>Unary negation; negates the data bits and keeps the scale and size.</summary>
public static BigFloat operator -(BigFloat r)
{
    return new(-r.DataBits, r.Scale, r._size);
}

/// <summary>
/// Increments the value by one. If the one's place lies below bit 1 of the data bits
/// (ExtraHiddenBits - Scale is less than 1) the value is returned unchanged.
/// </summary>
public static BigFloat operator ++(BigFloat r)
{
    // hidden bits = 4
    // A)  1111|1111__.  => 1111|1111<< 6   +1  =>  1111|1111__.
    // B)  1111|1111_.   => 1111|1111<< 5   +1  =>  10000|0000#.
    // C)  1111|1111.    => 1111|1111<< 4   +1  =>  10000|0000.
    // D)  1111|1.111    => 1111|1111<< 1   +1  =>  10000|0.111
    // E)  1111.|1111    => 1111|1111<< 0   +1  =>  10000.|1111
    // F)  111.1|1111    => 1111|1111<< -1  +1  =>  1000.1|1111
    // G)  .1111|1111    => 1111|1111<< -4  +1  =>  1.1111|1111
    // H) .01111|1111    => 1111|1111<< -5  +1  =>  1.01111|1111

    // Bit position of the one's place inside DataBits.
    int onesPlace = ExtraHiddenBits - r.Scale;

    if (onesPlace < 1)
    {
        return r;
    }

    // NOTE(review): a special case for "onesPlace == -1" used to follow here. It could never run
    // because of the guard above, so it was removed. If adding just below the LSB is meant to be
    // supported, the guard itself needs to change - confirm the intended behavior.

    BigInteger intVal = r.DataBits + (BigInteger.One << onesPlace);
    int sizeVal = (int)BigInteger.Abs(intVal).GetBitLength();
    // perf: re-measuring was found faster than tracking the carry, i.e. instead of
    //   (onesPlace > r._size) ? onesPlace + 1 : r._size + ((BigInteger.TrailingZeroCount(intVal) == r._size) ? 1 : 0)
    return new BigFloat(intVal, r.Scale, sizeVal);
}

/// <summary>
/// Decrements the value by one. If the one's place lies below bit 1 of the data bits
/// (ExtraHiddenBits - Scale is less than 1) the value is returned unchanged.
/// </summary>
public static BigFloat operator --(BigFloat r)
{
    // Bit position of the one's place inside DataBits.
    int onesPlace = ExtraHiddenBits - r.Scale;

    if (onesPlace < 1)
    {
        return r;
    }

    // NOTE(review): the unreachable "onesPlace == -1" special case was removed here as well
    // (see the note in operator ++).

    BigInteger intVal = r.DataBits - (BigInteger.One << onesPlace);
    int sizeVal = (int)BigInteger.Abs(intVal).GetBitLength();
    // perf: re-measuring was found faster than tracking the borrow (see operator ++).
    return new BigFloat(intVal, r.Scale, sizeVal);
}

/// <summary>
/// Adds two BigFloats. The result uses the larger of the two scales; the operand with the smaller scale is
/// right-shifted with rounding to line up. If one operand lies entirely below the other's scale, the other
/// operand is returned as-is.
/// </summary>
public static BigFloat operator +(BigFloat r1, BigFloat r2)
{
    // Shortcuts (to benchmark, does it actually save any time)
    // Given ExtraHiddenBits = 8, a number like "B2D"00 + 0.00"3F" should be just "B2D"00 since the smaller
    // number is below the precision range.
    //
    // Example: "12345678"9ABCDEF0________.         (Size: 29, _size: 61, Scale: 64)
    //        +                    "12"34560.789A   (Size:  5, _size: 37, Scale: 20)
    //        =  12345678"9ABCDEF0________.
    //
    // (if 64(r1.Scale) > 37(r2._size) + (20)r2.Scale then just return r1)
    int scaleDiff = r1.Scale - r2.Scale;

    if (scaleDiff > r2._size)
    {
        return r1;
    }

    if (-scaleDiff > r1._size)
    {
        return r2;
    }

    // Any precision that is below the precision of the number with the larger scale is dropped off.
    // Example: all the 7's would just be dropped off.
    //   "5555"00000     input:5555 shift:5(decimal)
    //    +"55577777"
    //  -------------
    //     "49"9922223   <--- answer is 50, only 2 significant digits.
    BigInteger sum;
    int resultScale;

    if (r1.Scale == r2.Scale)
    {
        sum = r1.DataBits + r2.DataBits;
        resultScale = r1.Scale;
    }
    else if (r1.Scale < r2.Scale)
    {
        sum = RightShiftWithRound(r1.DataBits, -scaleDiff) + r2.DataBits;
        resultScale = r2.Scale;
    }
    else // if (r1.Scale > r2.Scale)
    {
        sum = r1.DataBits + RightShiftWithRound(r2.DataBits, scaleDiff);
        resultScale = r1.Scale;
    }

    return new BigFloat(sum, resultScale, (int)BigInteger.Abs(sum).GetBitLength());
}

//////////////////////////////////////////////////////////////////////////////////////////////////////////////
//////////////////////////////////////// Rounding, Shifting, Truncate ////////////////////////////////////////
//////////////////////////////////////////////////////////////////////////////////////////////////////////////

/*                                           | BI | RoundTo| Scales  |Can Round  | Shift          |
 *                                           | or | nearest| or Sets | up to     | or             |
 * Public                                    | BF | int    | Size    |larger Size| Size by        | notes
 * ====================================================================================================================
 * P BF  =(<<, >>)BF                         | F  | No     | SetsSize| No        | (param)        | Provides a shift similar to other data types. (removes/adds bits)
 *   BI  =DataIntValueWithRound(BI)/Int      | I  | Rounds | Scales  | Yes       |ExtraHiddenBits | return WouldRound(val) ? (val >> ExtraHiddenBits) + 1 : val >> ExtraHiddenBits;
 *   BI  =DataIntValueWithRound(BI,bool)/Int | I  | Rounds | Scales  | Yes       |ExtraHiddenBits | return needToRound ? (val >> ExtraHiddenBits) + 1 : val >> ExtraHiddenBits;
 * P BF  =RightShiftWithRound(BF,int)        | F  | Rounds | Scales  | Yes       | (param)        |
 * P BF  =RightShiftWithRound(BF,int,out)    | F  | Rounds | Scales  | Yes       | (param)        |
 *   BI  =RightShiftWithRound(BI,ref int)    | I  | Rounds | Scales  | Yes       | (param)        |
 *   BI  =RightShiftWithRound(BI, int)       | I  | Rounds | Scales  | Yes       | (param)        |
 *   BF  =TruncateByAndRound(BF, int)        | F  | Rounds | SetsSize| Yes       | (param)        |
 *   BF  =TruncateToAndRound(BI, int)        | I  | Rounds | SetsSize| Yes       | (param)        |
 *   BF  =UpScale(BI, int)                   | I  | No     | Scales  | No        | (param)        | i.e. Shifts scale up
 *   BF  =DownScale(BI, int)                 | I  | No     | Scales  | No        | (param)        | i.e. Shifts using down
 *   BF  =AdjustScale(BI, int)               | I  | No     | Scales  | No        | (param)        | i.e. Shifts using up or down
 *   BF  =SetPrecision(BF, int)              | F  | No     | SetsSize| No        | (param)        |
 * P BF  =SetPrecisionWithRound(BF,int)      | F  | Rounds | SetsSize| Yes       | (param)        |
 *   BF  =ExtendPrecision(BF, int)           | F  | No     | SetsSize| No        | (param)        |
 *   BI  Int                                 | I  | Rounds | Scales  | Yes       |ExtraHiddenBits | i.e. Int => DataIntValueWithRound(_int);
 * Other:                                    |    |        |         |           |                |
 * P bool=WouldRound()                       | F  | Rounds | n/a     | Yes       |ExtraHiddenBits | return WouldRound(_int, ExtraHiddenBits);
 * P bool=WouldRound(int bottomBitsRemoved)  | F  | Rounds | n/a     | Yes       |ExtraHiddenBits | return WouldRound(_int, bottomBitsRemoved);
 * P bool=WouldRound(BI)                     | F  | Rounds | n/a     | Yes       |ExtraHiddenBits | return WouldRound(bi, ExtraHiddenBits);
 * P bool=WouldRound(BI,int bottomBitsRemove)| F  | Rounds | n/a     | Yes       | (param)        | return !(bi & ((BigInteger)1 << (bottomBitsRemoved - 1))).OutOfPrecision;
 *
 * SetsSize = forces a particular size using the param (instead of add/removes the size)
 * Scale    = adjusts the size by a specific amt
 */

/////////////////////////////////
////      WouldRound()
/////////////////////////////////

/// <summary>
/// Checks to see if the integerPart would round-up if the ExtraHiddenBits were removed.
/// e.g. 11010101 with 3 bits removed would be 11011.
/// </summary>
/// <returns>Returns true if this integerPart would round away from zero.</returns>
public bool WouldRound() => WouldRound(DataBits, ExtraHiddenBits);

/// <summary>
/// Checks to see if this integerPart would round-up given bottomBitsRemoved.
/// e.g. 11010101 with bottomBitsRemoved=3 would be 11011
/// </summary>
/// <param name="bottomBitsRemoved">The number of bits, counted from the least significant bit, that would be removed; rounding is decided by the top-most of them.</param>
/// <returns>Returns true if this integerPart would round away from zero.</returns>
public bool WouldRound(int bottomBitsRemoved) => WouldRound(DataBits, bottomBitsRemoved);

/// <summary>
/// Checks to see if this integerPart would round-up if ExtraHiddenBits are removed.
/// </summary>
/// <param name="bi">The BigInteger we would like check if it would round up.</param>
/// <returns>Returns true if this integerPart would round away from zero.</returns>
public static bool WouldRound(BigInteger bi)
{
    return WouldRound(bi, ExtraHiddenBits);
}

/// <summary>
/// Checks whether removing the lowest <paramref name="bottomBitsRemoved"/> bits of <paramref name="val"/>
/// would round the magnitude up, i.e. whether the most significant removed bit of the magnitude is set.
/// </summary>
/// <param name="val">The value to inspect. May be negative.</param>
/// <param name="bottomBitsRemoved">The number of low bits that would be removed. Zero or less never rounds.</param>
/// <returns>True if the value would round away from zero.</returns>
private static bool WouldRound(BigInteger val, int bottomBitsRemoved)
{
    // Nothing is removed, so nothing can round. Without this guard the shift count below becomes
    // negative (a left shift) and every negative value reported "true".
    if (bottomBitsRemoved <= 0)
    {
        return false;
    }

    // for .net 7 and later use ">>>" instead of >> for a slight performance boost.
    bool isPos = val.Sign >= 0;

    // Positive: the deciding bit can be read directly (odd after the shift => rounds).
    // Negative: subtracting one first makes the two's-complement bit the inverse of the magnitude's
    //           deciding bit (even after the shift => rounds).
    return isPos ^ ((isPos ? val : val - 1) >> (bottomBitsRemoved - 1)).IsEven;
}

/////////////////////////////////////////////
////    DataIntValue() for BigInteger    ////
/////////////////////////////////////////////

/// <summary>
/// Retrieves the internal data bits and removes ExtraHiddenBits and rounds.
/// </summary>
/// <param name="x">The _int part where to remove ExtraHiddenBits and round.</param>
private static BigInteger DataIntValueWithRound(BigInteger x) => RightShiftWithRound(x, ExtraHiddenBits);

/// <summary>
/// Removes ExtraHiddenBits and rounds. It also requires the current size and will adjust it if it grows.
/// </summary>
/// <param name="x">The _int part where to remove ExtraHiddenBits and round.</param>
/// <param name="size">IN: the size of x. OUT: the size after the hidden bits were removed.</param>
private static BigInteger DataIntValueWithRound(BigInteger x, ref int size)
    => RightShiftWithRound(x, ExtraHiddenBits, ref size);

/////////////////////////////////////////////
////      RightShift() for BigInteger    ////
/////////////////////////////////////////////

// Performance idea: what about doing: rolledOver = (x == (1 << x.bitLen)) (do this before the inc for neg numbers and do this after the inc for pos numbers)
// Performance idea: what about doing: "(b & uint.MaxValue) == 0" first as a quick check. (or use x.IsPowerOfTwo)
// Performance idea: bool rolledOver = b.IsPowerOfTwo || (b<<1).IsPowerOfTwo;

/// <summary>
/// Removes x number of bits of precision.
/// A special case of RightShift(>>) that will round based off the most significant bit in the removed bits(bitsToRemove).
/// This function will not adjust the scale. Like any shift, the value will be changed by some power of 2.
/// Caution: Round-ups may percolate to the most significant bit, adding an extra bit to the size.
///   e.g. RightShiftWithRound(0b111, 1) --> 0b100
/// Notes:
///   * Works on positive and negative numbers.
///   * If the part being removed has the most significant bit set, then the result will be rounded away from zero.
///   * If bitsToRemove is zero the value is returned unchanged; if it is negative the value is shifted up.
/// </summary>
/// <param name="val">The source BigInteger we would like right-shift.</param>
/// <param name="bitsToRemove">The number of bits to reduce the precision.</param>
/// <returns>The rounded result of shifting val to the right by bitsToRemove.</returns>
public static BigInteger RightShiftWithRound(BigInteger val, in int bitsToRemove)
{
    // Zero or negative: nothing is removed, so no rounding is needed. A negative count up-shifts.
    // (Zero must be handled here too: the negative-value path below pre-decrements val and
    //  relies on a real removed bit to undo it, so -5 with 0 bits removed came back as -6.)
    if (bitsToRemove <= 0)
    {
        return val >> bitsToRemove;
    }

    // BigInteger rounds toward negative infinity when down-shifting negative values.
    // Pre-decrementing turns that into "round half away from zero" together with the check below.
    if (val.Sign < 0)
    {
        val--;
    }

    BigInteger result = val >> bitsToRemove;

    // The most significant removed bit decides whether to step up by one.
    if (!(val >>> (bitsToRemove - 1)).IsEven)
    {
        result++;
    }

    return result;
}

/// <summary>
/// Removes x number of bits of precision. It also requires the current size and will increment it if it grows by a bit.
/// If the most significant bit of the removed bits is set, then the least significant bit will increment away from zero.
///   e.g. 1010010 >> 2 = 10101
/// Caution: Round-ups may percolate to the most significant bit, adding an extra bit to the size.
/// If bitsToRemove is zero or negative no rounding takes place: the value is returned unchanged (zero) or
/// shifted up (negative) and size is adjusted by the same amount.
/// THIS FUNCTION IS HIGHLY TUNED!
/// </summary>
/// <param name="val">The source BigInteger we would like right-shift.</param>
/// <param name="bitsToRemove">The number of bits to reduce the precision.</param>
/// <param name="size">IN: the size of Val.  OUT: The size of the output.</param>
public static BigInteger RightShiftWithRound(BigInteger val, in int bitsToRemove, ref int size)
{
    size = Math.Max(0, size - bitsToRemove);

    // Nothing is removed, so there is nothing to round. This must not reach the negative-value
    // path below: it pre-decrements val and relies on a real removed bit to undo that, so a
    // negative value with 0 bits removed came back one too small.
    if (bitsToRemove <= 0)
    {
        return val >> bitsToRemove;
    }

    if (val.Sign >= 0)
    {
        BigInteger result = val >>> bitsToRemove;

        // The most significant removed bit decides whether to round up.
        if (!(val >>> (bitsToRemove - 1)).IsEven)
        {
            result++;

            // The round-up carried into a new top bit.
            if ((result >> size).IsOne)
            {
                size++;
            }
        }
        return result;
    }

    // is Neg
    val--;

    BigInteger result2 = val >> bitsToRemove;

    if ((val >>> (bitsToRemove - 1)).IsEven)
    {
        // Magnitude rounded up; check whether it rolled over into a new top bit.
        if (((result2 - 1) >>> size).IsEven)
        {
            size++;
        }
    }
    else
    {
        result2++;
    }
    return result2;
}

/// <summary>
/// Removes x number of bits of precision.
/// If the most significant bit of the removed bits is set, then the least significant bit will increment away from zero.
///   e.g. 1010010 >> 2 = 10101
/// Caution: Round-ups may percolate to the most significant bit. This function will automatically remove that extra bit.
///   e.g. 1111111 >> 2 = 10000
/// Also see: ReducePrecision, TruncateByAndRound, RightShiftWithRoundWithCarryDownsize
/// </summary>
/// <param name="result">The result of val being right shifted and rounded. The size will be "size-bitsToRemove".</param>
/// <param name="val">The source BigInteger we would like right-shift.</param>
/// <param name="bitsToRemove">The number of bits that will be removed. Zero or less removes nothing and never rounds.</param>
/// <param name="size">The size of the input value if available. If negative then val.GetBitLength() is called.</param>
/// <returns>Returns True if an additional bit needed to be removed to achieve the desired size because of a round up.
///   e.g. 1111111 >> 2 = 10000</returns>
public static bool RightShiftWithRoundWithCarryDownsize(out BigInteger result, BigInteger val, in int bitsToRemove, int size = -1)
{
    // Nothing is removed, so there is nothing to round or carry. This must not reach the
    // negative-value path below: it pre-decrements val and relies on a real removed bit to undo
    // that, so a negative value with 0 bits removed came back one too small.
    if (bitsToRemove <= 0)
    {
        result = val >> bitsToRemove;
        return false;
    }

    if (size < 0)
    {
        size = (int)val.GetBitLength();
    }

    size = Math.Max(0, size - bitsToRemove);

    if (val.Sign >= 0)
    {
        result = val >> bitsToRemove; // on .net 7 and later use >>> instead of >> for a slight performance boost

        // The most significant removed bit decides whether to round up.
        if (!(val >> (bitsToRemove - 1)).IsEven) // on .net 7 and later use >>> instead of >> for a slight performance boost
        {
            result++;

            if ((result >> size).IsOne)
            {
                // Rounded up to a larger size, so remove the new trailing zero to keep the size the same.
                result >>= 1;
                return true;
            }
        }
        return false;
    }

    // is Neg
    val--;

    result = val >> bitsToRemove;

    if ((val >> (bitsToRemove - 1)).IsEven) // on .net 7 and later use >>> instead of >> for a slight performance boost
    {
        // Magnitude rounded up; if it rolled over into a new top bit, drop the extra bit.
        if (((result - 1) >> size).IsEven) // on .net 7 and later use >>> instead of >> for a slight performance boost
        {
            result >>= 1;
            return true;
        }
    }
    else
    {
        result++;
    }

    return false;
}

/// <summary>
/// Truncates a value by a specified number of bits by increasing the scale and reducing the precision.
/// If the most significant bit of the removed bits is set then the least significant bit will increment away from zero.
///   e.g. 10.10010 with 2 bits removed = 10.101
/// Caution: Round-ups may percolate to the most significant bit, adding an extra bit to the size.
///   Example: 11.11 with 1 bit removed would result in 100.0 (the same size)
/// This function uses the internal BigInteger RightShiftWithRound().
/// Also see: ReducePrecision, RightShiftWithRoundWithCarryDownsize, RightShiftWithRound
/// </summary>
/// <param name="x">The value to truncate.</param>
/// <param name="bitsToRemove">Specifies the number of least-significant bits to remove.</param>
/// <exception cref="ArgumentOutOfRangeException">Thrown when bitsToRemove is negative.</exception>
public static BigFloat TruncateByAndRound(BigFloat x, int bitsToRemove)
{
    if (bitsToRemove < 0)
    {
        throw new ArgumentOutOfRangeException(nameof(bitsToRemove), $"Param {nameof(bitsToRemove)}({bitsToRemove}) be 0 or greater.");
    }

    // RightShiftWithRound updates the size in place (it can stay one larger on a carry).
    int roundedSize = x._size;
    BigInteger roundedBits = RightShiftWithRound(x.DataBits, bitsToRemove, ref roundedSize);

    // The removed bits are compensated for by raising the scale by the same amount.
    return new BigFloat(roundedBits, x.Scale + bitsToRemove, roundedSize);
}

/// <summary>
/// Adjust the scale of a value. The data bits and size are carried over unchanged.
/// </summary>
/// <param name="x">The value whose scale should be adjusted.</param>
/// <param name="changeScaleAmount">The amount to change the scale.</param>
/// <returns>Returns a BigFloat with the updated scale.</returns>
public static BigFloat AdjustScale(BigFloat x, int changeScaleAmount)
{
    int adjustedScale = x.Scale + changeScaleAmount;
    return new BigFloat(x.DataBits, adjustedScale, x._size);
}

/// <summary>
/// This function will reduce the precision of a BigInteger to the number of bits specified.
/// If the part being removed has the most significant bit set, then the result will be rounded
/// away from zero. This can be used to reduce the precision prior to a large calculation.
/// Caution: Round-ups may percolate to the most significant bit, adding an extra bit to the size.
///   Example: TruncateToAndRound(15, 3) = 8 [4 bits]
/// Also see: SetPrecision, TruncateToAndRound
/// </summary>
/// <param name="x">The BigInteger whose precision should be reduced.</param>
/// <param name="newSizeInBits">The new requested size. The resulting size might be rounded up.</param>
/// <exception cref="ArgumentOutOfRangeException">Thrown when newSizeInBits is negative.</exception>
public static BigInteger TruncateToAndRound(BigInteger x, int newSizeInBits)
{
    if (newSizeInBits < 0)
    {
        throw new ArgumentOutOfRangeException(nameof(newSizeInBits), $"Param newSizeInBits({newSizeInBits}) be 0 or greater.");
    }

    // The number of bits to drop is the current magnitude length minus the requested length.
    int bitsToDrop = (int)BigInteger.Abs(x).GetBitLength() - newSizeInBits;
    return RightShiftWithRound(x, bitsToDrop);
}

/// <summary>
/// Sets the precision(and accuracy) of a number by appending 0 bits if too small or cropping bits if too large.
/// This can be useful for extending whole or rational numbers precision.
/// No rounding is performed.
///   Example: SetPrecision(0b1101, 8) --> 0b11010000;  SetPrecision(0b1101, 3) --> 0b110
/// Also see: TruncateToAndRound, SetPrecisionWithRound
/// </summary>
/// <param name="x">The source BigFloat where a new size will be forced.</param>
/// <param name="newSize">The requested size in bits (compared against x.Size; ExtraHiddenBits are added on top).</param>
/// <returns>A new BigFloat with the requested precision.</returns>
public static BigFloat SetPrecision(BigFloat x, int newSize)
{
    // Positive when bits are appended, negative when bits are cropped
    // (a negative BigInteger shift count shifts the other way).
    int growBy = newSize - x.Size;

    // The scale moves in the opposite direction so the represented value stays the same.
    return new BigFloat(x.DataBits << growBy, x.Scale - growBy, newSize + ExtraHiddenBits);
}

/// Reduces the precision of a number but keeps the value the same. /// i.e. Down-shifts the value and increases the scale by the same amount. /// Example: ReducePrecision(0b1101.1101, 3) --> 0b1101.1; /// No rounding is performed. /// Also see: TruncateByAndRound, RightShiftWithRoundWithCarryDownsize, RightShiftWithRound ///

/// <param name="x">The value whose precision is reduced.</param>
/// <param name="reduceBy">The number of low-order bits to drop. No validation is performed.</param>
public static BigFloat ReducePrecision(BigFloat x, int reduceBy)
{
    // Drop the low bits, raise the scale by the same count, and shrink the recorded size.
    BigInteger shortenedBits = x.DataBits >> reduceBy;
    int raisedScale = x.Scale + reduceBy;
    int shrunkSize = x._size - reduceBy;
    return new BigFloat(shortenedBits, raisedScale, shrunkSize);
}
///

/// Reduces the precision to the new specified size. To help maintain the most significant digits, the bits are not simply cut off. /// When reducing, the least significant bit will be rounded up if the most significant bit of the removed bits is set. /// This can be used to reduce the precision of a number prior to a calculation. /// Caution: Round-ups may percolate to the most significant bit, adding an extra bit to the size. /// Also see: SetPrecision, TruncateToAndRound ///

/// <param name="newSizeInBits">The desired precision in bits.</param>
public static BigFloat SetPrecisionWithRound(BigFloat x, int newSizeInBits)
{
    // TruncateByAndRound rejects a negative count, so requesting more bits than x.Size throws.
    return TruncateByAndRound(x, x.Size - newSizeInBits);
}
///

/// Extends the precision and accuracy of a number by appending 0 bits. /// e.g. 1.1 --> 1.100000 /// This can be useful for extending whole or rational numbers precision. ///

/// <param name="x">The source BigFloat that will be extended.</param>
/// <param name="bitsToAdd">The number of zero bits to add. Must not be negative.</param>
/// <returns>A BigFloat with bitsToAdd more bits of size and a correspondingly lower scale.</returns>
/// <exception cref="ArgumentOutOfRangeException">Thrown when bitsToAdd is negative.</exception>
public static BigFloat ExtendPrecision(BigFloat x, int bitsToAdd)
{
    if (bitsToAdd < 0)
    {
        throw new ArgumentOutOfRangeException(nameof(bitsToAdd), "cannot be a negative number");
    }

    return new BigFloat(x.DataBits << bitsToAdd, x.Scale - bitsToAdd, x._size + bitsToAdd);
}

/// Subtracts r2 from r1. The operand with the smaller scale is right-shifted so both
/// line up on the larger scale before the data bits are subtracted.
public static BigFloat operator -(BigFloat r1, BigFloat r2)
{
    bool r1HasSmallerScale = r1.Scale < r2.Scale;
    bool r2HasSmallerScale = r1.Scale > r2.Scale;

    BigInteger minuend = r1.DataBits;
    if (r1HasSmallerScale)
    {
        minuend >>= r2.Scale - r1.Scale;
    }

    BigInteger subtrahend = r2.DataBits;
    if (r2HasSmallerScale)
    {
        subtrahend >>= r1.Scale - r2.Scale;
    }

    BigInteger diff = minuend - subtrahend;

    // One unit is taken off when r1 was the shifted operand and is negative,
    // or otherwise when r2's data bits are negative.
    bool takeOneOff = r1HasSmallerScale ? r1.Sign < 0 : r2.DataBits.Sign < 0;
    if (takeOneOff)
    {
        diff--;
    }

    int size = Math.Max(0, (int)BigInteger.Abs(diff).GetBitLength());
    int resultScale = Math.Max(r1.Scale, r2.Scale);
    return new BigFloat(diff, resultScale, size);
}

/// Squares val. The product is rounded back down to the size of the input.
public static BigFloat PowerOf2(BigFloat val)
{
    BigInteger square = val.DataBits * val.DataBits;
    int squareBits = (int)square.GetBitLength();

    // Number of surplus low bits relative to the input size.
    int excessBits = squareBits - val._size;
    square = RightShiftWithRound(square, excessBits, ref squareBits);

    int squareScale = (2 * val.Scale) + excessBits - ExtraHiddenBits;
    BigFloat squared = new(square, squareScale, squareBits);
    AssertValid(squared);
    return squared;
}
///

/// Calculates a BigFloat to the power of 2 with a maximum output precision required. /// This function can save on compute cycles by not calculating bits that are not needed. ///

/// <param name="val">The base.</param>
/// <param name="maxOutputPrecisionInBits">The maximum number of bits needed in the output.</param>
/// <returns>A BigFloat holding val squared.</returns>
public static BigFloat PowerOf2(BigFloat val, int maxOutputPrecisionInBits)
{
    /*  valSz    resSize       skipIf
     *   3         5-6           maxOutputPrecisionInBits >= valSz*2
     *   4         7-8
     *   5         9-10                                                 */
    int overSized = (val._size * 2) - maxOutputPrecisionInBits - (2 * ExtraHiddenBits);

    // We can just use the one-argument PowerOf2 since the output will never be larger than maxOutputPrecisionInBits.
    if (overSized <= 1)
    {
        BigFloat p2 = PowerOf2(val);

        // If the size difference is 1 BUT the output size is still correct, just return.
        if (overSized <= 0 || p2._size == maxOutputPrecisionInBits)
        {
            return p2;
        }

        // Output is oversized by 1.
        // NOTE(review): this lowers the scale by one without shifting DataBits, which looks like it
        // halves the represented value - confirm this is intended.
        return new BigFloat(p2.DataBits, p2.Scale - 1, p2._size);
    }

    // At this point it is oversized by at least 2:
    //   oversized by 2 or 3 -> shrink input by 1
    //   oversized by 4 or 5 -> shrink input by 2
    int inputShrink = (overSized + 1) / 2;
    BigInteger valWithLessPrec = val.DataBits >> inputShrink;
    BigInteger prod = valWithLessPrec * valWithLessPrec;

    int resBitLen = (int)prod.GetBitLength();
    int shrinkBy = resBitLen - val._size - (2 * ExtraHiddenBits);
    int sizePart = resBitLen - shrinkBy;
    prod = RightShiftWithRound(prod, shrinkBy);

    // Both factors lost inputShrink low bits before the multiply, so the product is missing
    // 2 * inputShrink bits of magnitude; the scale has to carry them (operator * adds its
    // pre-shift to the scale in the same way).
    int resScalePart = (2 * val.Scale) + (2 * inputShrink) + shrinkBy - ExtraHiddenBits;
    return new(prod, resScalePart, sizePart);
}

//todo: finish and test (or delete)
/////

///// Calculates a BigFloat to the power of 2 with a maximum output precision required. ///// This function can save on compute cycles by not calculating bits that are needed. /////

///// The base.
///// The maximum number of bits needed in the output.
///// Returns a BigFloat that is val^exp where the precision is
//public static BigFloat PowerOf2(BigFloat val, int maxOutputPrecisionInBits)
//{
//    /*  valSz    resSize       skipIf
//     *   3         5-6           maxOutputPrecisionInBits >= valSz*2
//     *   4         7-8
//     *   5         9-10                                                 */
//    int overSized = (val.Size * 2) - maxOutputPrecisionInBits;
//    // We can just use PowerOf2 Function since output will never be larger then maxOutputPrecisionInBits.
//    if (overSized <= 1)
//    {
//        BigFloat p2 = PowerOf2(val);
//        // if size difference is 1 BUT the outputSize is still correct just return
//        if (overSized <= 0 || p2._size == maxOutputPrecisionInBits)
//        {
//            return p2;
//        }
//        // output is oversized by 1
//        return new BigFloat(p2._int, p2.Scale - 1, p2._size);
//    }
//    // at this point it is oversized by at least 2
//    //oversized by 2 then shrink input by 1
//    //oversized by 3 then shrink input by 1
//    //oversized by 4 then shrink input by 2
//    //oversized by 5 then shrink input by 2
//    int inputShrink = (overSized + 1) / 2;
//    BigInteger valWithLessPrec = val._int >> inputShrink;
//    BigInteger prod = valWithLessPrec * valWithLessPrec;
//    int resBitLen = (int)prod.GetBitLength();
//    int shrinkBy = resBitLen - val.Size - ExtraHiddenBits;
//    int sizePart = resBitLen - shrinkBy;
//    prod = RightShiftWithRound(prod, shrinkBy);
//    int resScalePart = (2 * val.Scale) + shrinkBy - ExtraHiddenBits;
//    return new(prod, resScalePart, sizePart);
//}

/// Multiplies two BigFloats. When the operand sizes differ by 32 bits or more, the larger
/// operand's data bits are right-shifted (by the size difference minus 16) before the multiply.
/// The product is then reduced with RightShiftWithRound to the size of the smaller operand.
public static BigFloat operator *(BigFloat a, BigFloat b)
{
    BigInteger prod;
    int shouldBe; // target size of the product: the size of the smaller operand
    const int SKIP_IF_SIZE_DIFF_SMALLER = 32;
    const int KEEP_EXTRA_PREC = 16;

    //perf: for performance what about no shift when _size's are around the same size. (like within 32)
    int sizeDiff = a._size - b._size;
    int shiftBy = Math.Max(0, Math.Abs(sizeDiff) - KEEP_EXTRA_PREC);

    // for size differences that are:
    //   0 to 31(SKIP_IF_SIZE_DIFF_SMALLER), no shift takes place (saves time on shift and increases precision on the LSB in rare cases)
    //   > 32, there is a shift of 16 or more (but size difference will be limited to 16 for extra precision)
    if (Math.Abs(sizeDiff) < SKIP_IF_SIZE_DIFF_SMALLER)
    {
        shiftBy = 0;
        prod = b.DataBits * a.DataBits;
        shouldBe = Math.Min(a._size, b._size);
    }
    else if (sizeDiff > 0)
    {
        // a is the larger operand: trim it before multiplying
        prod = (a.DataBits >> shiftBy) * b.DataBits;
        shouldBe = b._size;
    }
    else //if (sizeDiff < 0)
    {
        // b is the larger operand: trim it before multiplying
        prod = (b.DataBits >> shiftBy) * a.DataBits;
        shouldBe = a._size;
    }

    int sizePart = (int)BigInteger.Abs(prod).GetBitLength();
    int shrinkBy = sizePart - shouldBe;
    prod = RightShiftWithRound(prod, shrinkBy, ref sizePart);

    // The scale accounts for both operand scales, the bits dropped from the product (shrinkBy),
    // the bits dropped from the larger input (shiftBy), and one set of hidden bits.
    int resScalePart = a.Scale + b.Scale + shrinkBy + shiftBy - ExtraHiddenBits;
    BigFloat result = new(prod, resScalePart, sizePart);
    return result;
}

/// Divides the first operand by the second.
/// Note: the parameter names are inverted relative to conventional usage - the code divides
/// 'divisor' (the left operand) by 'dividend' (the right operand).
public static BigFloat operator /(BigFloat divisor, BigFloat dividend)
{
    // find the size of the smaller input to determine output size
    int outputSize = Math.Min(divisor.Size, dividend.Size);

    // If we right-shift divisor to align it with dividend and then divisor < dividend, then we need to decrement the output size.
    // This is because we would only have a partial bit of precision on the last bit, and it could introduce error.
    // note: We could also left shift dividend so it is left aligned with divisor but that would be more expensive. (but could be more accurate)
    // note: We can maybe speed this up by just checking the top 32 or 64 bits of each.
    // NOTE(review): the comparison is done on the signed data bits, not on magnitudes - confirm behaviour for negative operands.
    if (divisor.DataBits >> (divisor.Size - dividend.Size) <= dividend.DataBits)
    {
        outputSize--;
    }

    // We need to oversize T (using left shift) so when we divide, it is the correct size.
    int wantedSizeForT = (1 * dividend.Size) + outputSize + ExtraHiddenBits;
    int leftShiftTBy = wantedSizeForT - divisor.Size;
    BigInteger leftShiftedT = divisor.DataBits << leftShiftTBy; // rightShift used here instead of SetPrecisionWithRound for performance

    // Now we can just divide, and we should have the correct size
    BigInteger resIntPart = leftShiftedT / dividend.DataBits;
    int resScalePart = divisor.Scale - dividend.Scale - leftShiftTBy + ExtraHiddenBits;
    int sizePart = (int)BigInteger.Abs(resIntPart).GetBitLength();
    BigFloat result = new(resIntPart, resScalePart, sizePart);
    return result;
}

//////////////////////////////////////////////////////////////////////////////////////////////
/////////////////////////////////// implicit CASTS ///////////////////////////////////////////
//////////////////////////////////////////////////////////////////////////////////////////////

///

Defines an implicit conversion of an 8-bit signed integer to a BigFloat.

// Implicit widening of an sbyte: forwards to the matching BigFloat constructor.
public static implicit operator BigFloat(sbyte value) => new(value);
///

Defines an implicit conversion of a 16-bit unsigned integer to a BigFloat.

// Implicit widening of a ushort: forwards to the matching BigFloat constructor.
public static implicit operator BigFloat(ushort value) => new(value);
///

Defines an implicit conversion of a signed 16-bit integer to a BigFloat.

// Implicit widening of a short: forwards to the matching BigFloat constructor.
public static implicit operator BigFloat(short value) => new(value);
///

Defines an implicit conversion of a 32-bit unsigned integer to a BigFloat.

// Implicit widening of a uint: forwards to the matching BigFloat constructor.
public static implicit operator BigFloat(uint value) => new(value);
///

Defines an implicit conversion of a signed 32-bit integer to a BigFloat.

// Implicit widening of an int: forwards to the matching BigFloat constructor.
public static implicit operator BigFloat(int value) => new(value);
///

Defines an implicit conversion of a 64-bit unsigned integer to a BigFloat.

// Implicit widening of a ulong: forwards to the matching BigFloat constructor.
public static implicit operator BigFloat(ulong value) => new(value);
///

Defines an implicit conversion of a signed 64-bit integer to a BigFloat.

// Implicit widening of a long: forwards to the matching BigFloat constructor.
public static implicit operator BigFloat(long value) => new(value);
///

Defines an implicit conversion of an unsigned 128-bit integer to a BigFloat.

// Implicit widening of a UInt128: forwards to the matching BigFloat constructor.
public static implicit operator BigFloat(UInt128 value) => new(value);
///

Defines an implicit conversion of a signed 128-bit integer to a BigFloat.

// Implicit widening of an Int128: forwards to the matching BigFloat constructor.
public static implicit operator BigFloat(Int128 value) => new(value);

//////////////////////////////////////////////////////////////////////////////////////////////
/////////////////////////////////// explicit CASTS ///////////////////////////////////////////
//////////////////////////////////////////////////////////////////////////////////////////////

/// ///

Defines an explicit conversion of a System.Decimal object to a BigFloat.

//public static explicit operator BigFloat(decimal input) => new BigFloat(input); ///

Defines an explicit conversion of a BigFloat to a unsigned byte.

// The scale is applied to the raw data bits first; DataIntValueWithRound (defined elsewhere
// in this type) then yields the integer that is narrowed to a byte.
public static explicit operator byte(BigFloat value)
    => (byte)DataIntValueWithRound(value.DataBits << value.Scale);
///

Defines an explicit conversion of a BigFloat to a signed byte.

// The scale is applied to the raw data bits first; DataIntValueWithRound (defined elsewhere
// in this type) then yields the integer that is narrowed to an sbyte.
public static explicit operator sbyte(BigFloat value)
    => (sbyte)DataIntValueWithRound(value.DataBits << value.Scale);
///

Defines an explicit conversion of a BigFloat to a unsigned 16-bit integer. /// The fractional part (including ExtraHiddenBits) are simply discarded.

// The scale is applied to the raw data bits first; DataIntValueWithRound (defined elsewhere
// in this type) then yields the integer that is narrowed to a ushort.
public static explicit operator ushort(BigFloat value)
    => (ushort)DataIntValueWithRound(value.DataBits << value.Scale);
///

Defines an explicit conversion of a BigFloat to a 16-bit signed integer. /// The fractional part (including ExtraHiddenBits) are simply discarded.

// The scale is applied to the raw data bits first; DataIntValueWithRound (defined elsewhere
// in this type) then yields the integer that is narrowed to a short.
public static explicit operator short(BigFloat value)
    => (short)DataIntValueWithRound(value.DataBits << value.Scale);
///

Defines an explicit conversion of a BigFloat to a unsigned 64-bit integer. /// The fractional part (including ExtraHiddenBits) are simply discarded.

// The scale is applied to the raw data bits first; DataIntValueWithRound (defined elsewhere
// in this type) then yields the integer that is narrowed to a ulong.
public static explicit operator ulong(BigFloat value)
    => (ulong)DataIntValueWithRound(value.DataBits << value.Scale);
///

Defines an explicit conversion of a BigFloat to a 64-bit signed integer. /// The fractional part (including ExtraHiddenBits) are simply discarded.

// The scale is applied to the raw data bits first; DataIntValueWithRound (defined elsewhere
// in this type) then yields the integer that is narrowed to a long.
public static explicit operator long(BigFloat value)
    => (long)DataIntValueWithRound(value.DataBits << value.Scale);
///

Defines an explicit conversion of a BigFloat to a unsigned 128-bit integer. /// The fractional part (including ExtraHiddenBits) are simply discarded.

// The scale is applied to the raw data bits first; DataIntValueWithRound (defined elsewhere
// in this type) then yields the integer that is narrowed to a UInt128.
public static explicit operator UInt128(BigFloat value)
    => (UInt128)DataIntValueWithRound(value.DataBits << value.Scale);
///

Defines an explicit conversion of a BigFloat to a signed 128-bit integer. /// The fractional part (including ExtraHiddenBits) are simply discarded.

// The scale is applied to the raw data bits first; DataIntValueWithRound (defined elsewhere
// in this type) then yields the integer that is narrowed to an Int128.
public static explicit operator Int128(BigFloat value)
    => (Int128)DataIntValueWithRound(value.DataBits << value.Scale);
///

/// Casts a BigInteger to a BigFloat. The ExtraHiddenBits are set to zero. /// Example: a BigInteger of 1 would translate to "1+ExtraHiddenBits" bits of precision. ///

/// <param name="value">The BigInteger to cast to a BigFloat.</param>
public static explicit operator BigFloat(BigInteger value) => new(value);
///

Defines an explicit conversion of a System.Double to a BigFloat.

// Explicit conversion from double: forwards to the BigFloat(double) constructor.
public static explicit operator BigFloat(double value) => new(value);
///

Defines an explicit conversion of a BigFloat to a Double. /// Caution: Precision is not preserved since double is hard coded with 53 bits of precision.

// Builds the IEEE-754 bit pattern of a double by hand from the top 53 data bits and the exponent.
// Returns 0.0 or NaN for out-of-precision values, signed zero when the biased exponent is <= 0
// (subnormals are not produced), and signed infinity when it exceeds 2046.
public static explicit operator double(BigFloat value)
{
    // Future: handle Subnormal numbers (when the exponent field contains all 0's) for anything from 2.2250738585072014 × 10−308 up to 4.9406564584124654E-324.
    if (value.OutOfPrecision)
    {
        return value.IsZero ? 0.0 : double.NaN;
    }

    // Align the magnitude so 53 bits remain, then flip bit 52 with XOR
    // (presumably the always-set leading bit, leaving the 52 stored fraction bits - confirm).
    BigInteger top53 = BigInteger.Abs(value.DataBits) >> (value._size - 53);
    long fraction = (long)top53 ^ (1L << 52);

    long biasedExp = value.Exponent + 1022;

    // Check to see if it fits in a normalized double (untested)
    if (biasedExp <= 0)
    {
        return value.IsPositive ? 0.0 : double.NegativeZero;
    }

    if (biasedExp > 2046)
    {
        return value.IsPositive ? double.PositiveInfinity : double.NegativeInfinity;
    }

    long rawBits = fraction | (biasedExp << 52);

    // Set the sign bit for negative values.
    if (value.DataBits.Sign < 0)
    {
        rawBits ^= 1L << 63;
    }

    return BitConverter.Int64BitsToDouble(rawBits);
}
///

/// Casts a BigFloat to a BigInteger. The fractional part (including hidden bits) are simply discarded. ///

/// <param name="value">The BigFloat to cast as a BigInteger.</param>
public static explicit operator BigInteger(BigFloat value)
{
    // Shifting by (Scale - ExtraHiddenBits) moves the data bits to their integer position.
    int shift = value.Scale - ExtraHiddenBits;
    return value.DataBits << shift;
}
///

Defines an explicit conversion of a BigFloat to a single-precision floating-point number. /// Caution: Precision is not preserved since float is hard coded with 24 bits of precision.

// Builds the IEEE-754 bit pattern of a float by hand from the top 24 data bits and the exponent.
// Returns 0 or NaN for out-of-precision values, signed zero when the biased exponent is <= 0
// (subnormals are not produced), and signed infinity when it exceeds 254.
public static explicit operator float(BigFloat value)
{
    // Future: handle subnormal numbers (when the exponent field contains all 0's).
    if (value.OutOfPrecision)
    {
        return value.IsZero ? 0.0f : float.NaN;
    }

    // Align the magnitude so 24 bits remain, then flip bit 23 with XOR
    // (presumably the always-set leading bit, leaving the 23 stored fraction bits - confirm).
    BigInteger top24 = BigInteger.Abs(value.DataBits) >> (value._size - 24);
    int fraction = (int)top24 ^ (1 << 23);

    int biasedExp = value.Exponent + 126;

    // Check to see if it fits in a normalized float (untested)
    if (biasedExp <= 0)
    {
        return value.IsPositive ? 0f : float.NegativeZero;
    }

    if (biasedExp > 254)
    {
        return value.IsPositive ? float.PositiveInfinity : float.NegativeInfinity;
    }

    int rawBits = fraction | (biasedExp << 23);

    // Set the sign bit for negative values.
    if (value.DataBits.Sign < 0)
    {
        rawBits ^= 1 << 31;
    }

    return BitConverter.Int32BitsToSingle(rawBits);
}
///

Defines an explicit conversion of a System.Single to a BigFloat.

// Explicit conversion from float: forwards to the BigFloat(float) constructor.
public static explicit operator BigFloat(float value) => new(value);
///

Defines an explicit conversion of a BigFloat to a 32-bit signed integer.

// Shifts the data bits by (Scale - ExtraHiddenBits) and narrows the resulting BigInteger to int.
// Unlike the byte/short/long conversions in this file, this does not go through DataIntValueWithRound.
public static explicit operator int(BigFloat value)
{
    BigInteger integerPart = value.DataBits << (value.Scale - ExtraHiddenBits);
    return (int)integerPart;
}
///

Defines an explicit conversion of a BigFloat to an unsigned 32-bit integer. The fractional part (including hidden bits) is simply discarded.

// Shifts the data bits by (Scale - ExtraHiddenBits) and narrows the resulting BigInteger to uint.
// Unlike the byte/short/long conversions in this file, this does not go through DataIntValueWithRound.
public static explicit operator uint(BigFloat value)
{
    BigInteger integerPart = value.DataBits << (value.Scale - ExtraHiddenBits);
    return (uint)integerPart;
}
///

Checks to see if a BigFloat's value would fit into a normalized double without the exponent overflowing or underflowing. /// Since BigFloats can be any precision and doubles have fixed 53-bits precision, precision is ignored.

// True when the biased exponent (Exponent + 1023 - 1) lies in [-52, 2046].
// NOTE(review): the lower bound of -52 admits exponents that the explicit double conversion
// in this file flushes to zero (it returns zero for a biased exponent <= 0) - confirm intent.
public bool FitsInADouble()
{
    // future (possibly): add denormalized support
    // stricter alternative kept from the original: biased exponent must be in (0, 2046]
    int biasedExponent = Exponent + 1023 - 1;
    return biasedExponent >= -52 && biasedExponent <= 2046;
}

/////////////////////////////////// COMPARE FUNCTIONS ////////////////////////////////////////////////////////

///

Returns a value that indicates whether the current instance and a signed 64-bit integer have the same value.

// Compares this BigFloat with a signed 64-bit integer.
public bool Equals(long other)
{
    //Todo: what about zero?
    int exponent = Exponent;

    // 'this' is too large, not possible to be equal.
    if (exponent > 64)
    {
        return false;
    }

    // A negative exponent is treated as equal only to zero.
    if (exponent < 0)
    {
        return other == 0;
    }

    // Short-circuit: long.MinValue is the only long that needs 64 bits of magnitude.
    if (exponent == 64 && other != long.MinValue)
    {
        return false;
    }

    if (Scale >= 0)
    {
        // Drop the hidden bits on our side and the bits below our scale on the other side.
        return DataBits >> ExtraHiddenBits == other >> Scale;
    }

    return DataBits << (Scale - ExtraHiddenBits) == other;
}
///

Returns a value that indicates whether the current instance and an unsigned 64-bit integer have the same value.

// Compares this BigFloat with an unsigned 64-bit integer.
public bool Equals(ulong other)
{
    int exponent = Exponent;

    // too large
    if (exponent > 64)
    {
        return false;
    }

    // A negative exponent is treated as equal only to zero.
    if (exponent < 0)
    {
        return other == 0;
    }

    // A negative value can never equal an unsigned integer.
    if (DataBits.Sign < 0)
    {
        return false;
    }

    if (Scale >= 0)
    {
        // Drop the hidden bits on our side and the bits below our scale on the other side.
        return DataBits >> ExtraHiddenBits == other >> Scale;
    }

    return DataBits << (Scale - ExtraHiddenBits) == other;
}
///

/// Returns true if the integer part of the BigFloat matches 'other'. /// Examples: 1.1 == 1, 1.6 != 1, 0.6==1 ///

// Compares 'other' against this instance's Int property.
public bool Equals(BigInteger other) => other.Equals(Int);
///

/// Returns true if this BigFloat and 'other' have the same value (within the precision). /// Examples: 1.11 == 1.1, 1.00 == 1.0, 1.11 != 1.10, 1.1 == 1.01 ///

// Equality is defined through CompareTo: two values are equal when it reports 0.
public bool Equals(BigFloat other) => CompareTo(other) == 0;
///

/// Returns true if the parent's BigFloat value has the same value of the object considering their precisions. ///

// Returns false for null or for any object that is not a boxed BigFloat; otherwise defers to
// Equals(BigFloat). The type pattern replaces the GetType() comparison plus cast, which boxed
// 'this' on every call; the result is the same because a struct cannot be derived from.
public override bool Equals(object obj)
{
    return obj is BigFloat other && Equals(other);
}
///

Returns a 32-bit signed integer hash code for the current BigFloat object.

// Combines the hash of DataIntValueWithRound(DataBits) with the scale via XOR.
// NOTE(review): Equals(BigFloat) is based on CompareTo, so values that compare equal but carry
// different scales would presumably hash differently - confirm against the hash/equals contract.
public override int GetHashCode()
{
    int valueHash = DataIntValueWithRound(DataBits).GetHashCode();
    return valueHash ^ Scale;
}

////////////////////////////////////////////////////////////////////////////////////////////
//////////////////////////////// MATH FUNCTIONS ////////////////////////////////////////////
////////////////////////////////////////////////////////////////////////////////////////////

///

/// Calculates the square root of a big floating point number. ///

/// <param name="x0">The input.</param>
/// <param name="wantedPrecision">(Optional)The number of in-precision bits to return. 0 means: use the input's size without the hidden bits.</param>
/// <returns>Returns the Sqrt of x as a BigFloat.</returns>
public static BigFloat Sqrt(BigFloat x0, int wantedPrecision = 0)
{
    BigFloat x = x0;// new BigFloat(x0.Int*8, x0._scale-3);
    if (wantedPrecision == 0)
    {
        wantedPrecision = x._size - ExtraHiddenBits;
    }

    // Zero input: return a zero directly without running the integer square root.
    if (x.DataBits == 0)
    {
        return new BigFloat((BigInteger)0, wantedPrecision, 0);
    }

    // Output should be (_int.GetBitLength()/2)+16
    int totalLen = x.Scale + (x._size - ExtraHiddenBits);

    // Widen the input so the integer root has the wanted number of bits; the (totalLen & 1)
    // term adjusts the shift by one when totalLen is odd.
    int needToShiftInputBy = (2 * wantedPrecision) - (x._size - ExtraHiddenBits) - (totalLen & 1);
    BigInteger intPart = NewtonPlusSqrt(x.DataBits << (needToShiftInputBy + ExtraHiddenBits));
    int retShift = ((totalLen + (totalLen > 0 ? 1 : 0)) / 2) - wantedPrecision;
    BigFloat result = new(intPart, retShift, (int)intPart.GetBitLength()); //new version 2022-11-12
    return result;
}

// The world's fastest sqrt for C# and Java.
// https://www.codeproject.com/Articles/5321399/NewtonPlus-A-Fast-Big-Number-Square-Root-Function
// Integer square root of a BigInteger. Small inputs are handled with hardware Math.Sqrt plus a
// correction; larger inputs start from a hardware estimate and are refined with Newton steps.
// NOTE(review): no explicit check for negative x is made here - confirm callers never pass one.
private static BigInteger NewtonPlusSqrt(BigInteger x)
{
    // Tier 1: hardware sqrt on the value converted to ulong, with a one-step downward fix.
    if (x < 144838757784765629) // 1.448e17 = ~1<<57
    {
        uint vInt = (uint)Math.Sqrt((ulong)x);
        if (x >= 4503599761588224 && (ulong)vInt * vInt > (ulong)x) // 4.5e15 = ~1<<52
        {
            vInt--;
        }
        return vInt;
    }

    double xAsDub = (double)x;

    // Tier 2: hardware estimate followed by one Newton step in 64-bit arithmetic.
    if (xAsDub < 8.5e37) // long.max*long.max
    {
        ulong vInt = (ulong)Math.Sqrt(xAsDub);
        BigInteger v = (vInt + (ulong)(x / vInt)) >> 1;
        return v * v <= x ? v : v - 1;
    }

    // Tier 3: hardware estimate followed by one or two Newton steps in BigInteger arithmetic.
    if (xAsDub < 4.3322e127)
    {
        BigInteger v = (BigInteger)Math.Sqrt(xAsDub);
        v = (v + (x / v)) >> 1;
        if (xAsDub > 2e63)
        {
            v = (v + (x / v)) >> 1;
        }
        return v * v <= x ? v : v - 1;
    }

    int xLen = (int)x.GetBitLength();
    int wantedPrecision = (xLen + 1) / 2;
    int xLenMod = xLen + (xLen & 1) + 1;

    //////// Do the first Sqrt on hardware ////////
    long tempX = (long)(x >> (xLenMod - 63));
    double tempSqrt1 = Math.Sqrt(tempX);
    // Keep the low 53 bits of the double's raw bit pattern.
    ulong valLong = (ulong)BitConverter.DoubleToInt64Bits(tempSqrt1) & 0x1fffffffffffffL;
    if (valLong == 0)
    {
        valLong = 1UL << 53;
    }

    //////// Classic Newton Iterations ////////
    BigInteger val = ((BigInteger)valLong << 52) + ((x >> (xLenMod - (3 * 53))) / valLong);
    int size = 106;
    // Each pass doubles 'size' (106 -> 212 -> 424); the loop stops once size reaches 256 or more.
    for (; size < 256; size <<= 1)
    {
        val = (val << (size - 1)) + ((x >> (xLenMod - (3 * size))) / val);
    }

    if (xAsDub > 4e254) // 4e254 = 1<<845.76973610139
    {
        int numOfNewtonSteps = BitOperations.Log2((uint)(wantedPrecision / size)) + 2;

        ////// Apply Starting Size ////////
        int wantedSize = (wantedPrecision >> numOfNewtonSteps) + 2;
        int needToShiftBy = size - wantedSize;
        val >>= needToShiftBy;
        size = wantedSize;
        do
        {
            //////// Newton Plus Iterations ////////
            int shiftX = xLenMod - (3 * size);
            BigInteger valSqrd = (val * val) << (size - 1);
            BigInteger valSU = (x >> shiftX) - valSqrd;
            val = (val << size) + (valSU / val);
            size *= 2;
        } while (size < wantedPrecision);
    }

    /////// There are a few extra digits here, let's save them. ///////
    int oversizedBy = size - wantedPrecision;

    //////// Shrink result to wanted Precision ////////
    val >>= oversizedBy;
    return val;
}
///

/// Returns the inverse of a BigFloat. ///

// Computes 1/x by dividing a left-shifted one by x's data bits.
// A zero x reaches BigInteger division with a zero divisor.
public static BigFloat Inverse(BigFloat x)
{
    // Oversize the numerator (a shifted one) so the integer quotient comes out at the right size.
    int numeratorShift = 2 * (x._size - 1);
    BigInteger numerator = BigInteger.One << numeratorShift;

    // Now we can just divide, and we should have the correct size.
    BigInteger quotient = numerator / x.DataBits;

    int quotientScale = -x.Scale - numeratorShift + ExtraHiddenBits + ExtraHiddenBits;
    int quotientBits = (int)BigInteger.Abs(quotient).GetBitLength();
    return new BigFloat(quotient, quotientScale, quotientBits);
}
///

/// Raises a BigFloat base to an integer exponent. The exponent is treated as exact. ///

/// <param name="value">The base of the exponent.</param>
/// <param name="exponent">The number of times value should be multiplied. Negative exponents invert the result.</param>
/// <param name="outPrecisionMatchesInput">When true, output precision is matched to input precision. When false, precision uses exponent rules based on "value^exp ± exp*error^(n-1)".</param>
public static BigFloat Pow(BigFloat value, int exponent, bool outPrecisionMatchesInput = false)
{
    // NOTE(review): Math.Abs throws OverflowException for int.MinValue - confirm that is acceptable here.
    uint pwr = (uint)Math.Abs(exponent);

    // Exponents -2..2 are answered directly.
    if (pwr < 3)
    {
        return exponent switch
        {
            0 => BigFloat.One, //new BigFloat(BigInteger.One >> value.Scale, value.Scale),
            1 => value,
            -1 => Inverse(value),
            2 => value * value,
            _ /*-2*/ => Inverse(value * value)
        };
    }

    // Used a Genetic Algorithm in Excel to figure out the formula's below (2 options)
    int expectedFinalPrecision = value._size;
    if (outPrecisionMatchesInput)
    {
        expectedFinalPrecision += /*(int)(power / (1 - value)) -*/ BitOperations.Log2(pwr); // the first part is only for smaller values with large exponents
    }

    // if the input precision is <53 bits AND the output will not overflow THEN we can fit this in a double.
    if (expectedFinalPrecision < 53)
    {
        // Lets first make sure we would have some precision remaining after our exponent operation.
        if (expectedFinalPrecision <= 0)
        {
            return ZeroWithNoPrecision; // technically more of a "NA".
        }

        //bool expOverflows = value.Exponent < -1022 || value.Exponent > 1023;
        // The scale is lowered by (Exponent - 1) before converting to double; it is restored below.
        int removedExp = value.Exponent - 1;

        // todo: can be improved without using BigFloat (See Pow(BigInteger,BigInteger) below)
        double valAsDouble = (double)new BigFloat(value.DataBits, value.Scale - removedExp, true); //or just "1-_size"? (BigFloat should be between 1 and 2)

        //// if final result's scale would not fit in a double.
        //int finalSizeWillBe = (int)(power * double.Log2(double.Abs(valAsDouble)));
        //bool finalResultsScaleFitsInDouble = finalSizeWillBe < 1020; // should be <1023, but using 1020 for safety
        //if (!finalResultsScaleFitsInDouble)
        //    valAsDouble = (double)new BigFloat(value._int, value.Scale - removedExp, true); //or just "1-_size"? (BigFloat should be between 1 and 2)

        // perform the power operation in hardware
        double res = double.Pow(valAsDouble, exponent);
        BigFloat tmp = (BigFloat)res;
        value = SetPrecision(tmp, expectedFinalPrecision - ExtraHiddenBits);

        // restore Scale: the removed exponent applies once per multiplication
        value = new BigFloat(value.DataBits, value.Scale + (removedExp * exponent), true);
        return value;
    }

    // the expectedFinalPrecision >= 53 bits and Power >= 3, so pretty big.
    // for each bit in the exponent, we need to multiply in 2^position
    int powerBitCount = BitOperations.Log2(pwr) + 1;

    // First Loop
    // Square-and-multiply: 'powers' is squared each round and folded into 'product'
    // whenever the corresponding bit of pwr is set.
    BigFloat product = ((pwr & 1) == 1) ? value : BigFloat.OneWithAccuracy(value.Size);
    BigFloat powers = value;
    for (int i = 1; i < powerBitCount; i++)
    {
        powers = PowerOf2(powers);
        if (((pwr >> i) & 1) == 1) // bit is set
        {
            product *= powers;
        }
    }

    if (exponent < 0)
    {
        product = Inverse(product);
    }
    //product.DebugPrint("bf1");
    return product;
}

//future: Create BigFloat version of PowMostSignificantBits()
//todo: set to private

///

/// <summary>
/// Returns the top n bits for a BigInteger raised to a power.
/// If <paramref name="wantedBits"/> is not specified, the output precision will match <paramref name="valSize"/>.
/// The number of removed bits are returned in <paramref name="totalShift"/>.
/// The returned result, left shifted by <paramref name="totalShift"/>, would return the actual result.
/// The result is rounded using the top most removed bit.
/// When the result is rounded in some borderline cases (e.g. 100|011111), the result can occasionally
/// round-up. When it rounds-up, it will be in the upward direction only. This is less likely
/// if <paramref name="extraAccurate"/> is true. There are no known rounding errors at this time with
/// <paramref name="extraAccurate"/> enabled.
/// </summary>
/// <param name="val">The input value.</param>
/// <param name="exp">The exponent to raise the value by.</param>
/// <param name="totalShift">(out) The number of bits that were removed from the result. This is negative
/// when <paramref name="val"/> had to be padded to reach <paramref name="wantedBits"/>.</param>
/// <param name="valSize">The input value's size in bits. This can be left at zero (or less) if unknown,
/// in which case it is computed from <paramref name="val"/>.</param>
/// <param name="wantedBits">The number of bits to return. An unspecified value, or a value of zero or less,
/// defaults to the input's size. A value larger than <paramref name="valSize"/> causes
/// <paramref name="val"/> to be left-shifted (zero padded) to that size before the power is taken.</param>
/// <param name="extraAccurate">When false, about 1-in-4096 will round up when it shouldn't. When true, accuracy
/// is much better but performance is slower.</param>
/// <param name="roundDown">Only consulted when <paramref name="exp"/> is 1 or 2. When true the reduction is done
/// with RightShiftWithRound and no carry adjustment is applied to <paramref name="totalShift"/>; when false
/// RightShiftWithRoundWithCarryDownsize is used.</param>
/// <returns>The top bits of <paramref name="val"/> raised to the power of <paramref name="exp"/>.</returns>
/// <exception cref="OverflowException">Thrown when exp * valSize would not fit in an int, or when the
/// double-precision fast path produces infinity.</exception>
public static BigInteger PowMostSignificantBits(BigInteger val, int exp, out int totalShift, int valSize = -1, int wantedBits = 0, bool extraAccurate = false, bool roundDown = false)
{
    totalShift = 0;

    if (valSize <= 0)
    {
        if (val.IsZero)
        {
            return BigInteger.Zero;
        }

        valSize = (int)val.GetBitLength();
    }
    else
    {
#if DEBUG
        // Make sure the supplied valSize size is set correctly.
        Debug.Assert(BigInteger.Abs(val).GetBitLength() == valSize, $"The supplied {nameof(valSize)} is not correct.");
#endif
    }

    // Lets make sure the number of wanted bits is valid.
    // Zero and negative values both mean "use the input's size" (matches the documented contract).
    if (wantedBits <= 0)
    {
        wantedBits = valSize;
    }
    else if (wantedBits > valSize)
    {
        // 3 choices:
        // A) either shrink wanted bits to valSize
        //wantedBits = valSize;

        // B) or, make val larger
        int growBy = wantedBits - valSize;
        val <<= growBy;
        valSize += growBy;
        // Padding val by growBy bits scales val^exp by 2^(growBy*exp); record that so it can be undone.
        totalShift = -growBy * exp;

        // C) or, just throw an error
        //throw new OverflowException("The val's size is less then the wantedBits.");
    }

    if (((long)exp * valSize) >= int.MaxValue)
    {
        throw new OverflowException("Overflow: The output 'totalShift' would be too large to fit in an 'int'. (exp * size > int.maxSize");
    }

    int workingSize;
    int expSz = BitOperations.Log2((uint)exp) + 1;

    if (extraAccurate)
    {
        // This version is more accurate but is slower. There is just one known incident when it does not round up like it should.
        // JUST ONE KNOWN ROUND ERROR between 16 to 20 is 51^17938 (no known rounding error when extraPrecisionBits is above 20)
        //   searches @16: (1-2000)^(2-39,999), (1-126,000)^(2-3999), (1-134,654,818)^(1-1500)
        workingSize = (2 * wantedBits) + expSz + 22/*extraPrecisionBits(adjustable)*/;
    }
    else
    {
        // Odds of an incorrect round-up(ex: 7.50001 not rounding up to 8) ~= 18.12/(2^ExtraBits)
        //   0=18.1%; 1=9.1%; 2=4.5%; 3=2.3%; 4=1.1%; 5=0.6%; 8=1/4096
        workingSize = wantedBits + expSz + 8/*extraPrecisionBits(adjustable)*/;
    }

    if (exp < 3)
    {
        BigInteger result;
        switch (exp)
        {
            case 0:
                result = BigInteger.One;
                // totalShift is already 0 here (any padding compensation is -growBy * 0).
                break;

            case 1:
                {
                    int dropBits = valSize - wantedBits;
                    // Accumulate (not assign) so the padding compensation recorded above is preserved.
                    totalShift += dropBits;
                    if (roundDown)
                    {
                        result = RightShiftWithRound(val, dropBits);
                    }
                    else
                    {
                        bool carried1 = RightShiftWithRoundWithCarryDownsize(out result, val, dropBits, valSize);
                        if (carried1)
                        {
                            totalShift++;
                        }
                    }

                    break;
                }

            case 2:
                {
                    BigInteger sqr = val * val;
                    // A square of an n-bit value is either 2n or 2n-1 bits; test the would-be top bit.
                    int sqrSize = (2 * valSize) - (((sqr >> ((2 * valSize) - 1)) > 0) ? 0 : 1);
                    int dropBits = sqrSize - wantedBits;
                    // Accumulate (not assign) so the padding compensation recorded above is preserved.
                    totalShift += dropBits;
                    if (roundDown)
                    {
                        // Shift the square itself (previously 'val' was shifted here by mistake).
                        result = RightShiftWithRound(sqr, dropBits);
                    }
                    else
                    {
                        bool carried1 = RightShiftWithRoundWithCarryDownsize(out result, sqr, dropBits, sqrSize);
                        if (carried1)
                        {
                            totalShift++;
                        }
                    }

                    break;
                }

            default: // negative exp would be less then 1 (unless 1)
                result = val != 1 ? BigInteger.Zero : val.Sign;
                break;
        }

        return result;
    }

    // if the input precision is <53 bits AND the output will not overflow THEN we can fit this in a double.
    if ((wantedBits > 2) && (wantedBits < 53) && (valSize * exp) < 3807)
    {
        //// Lets first make sure we would have some precision remaining after our exponent operation.
        if (valSize == 0)
        {
            return BigInteger.Zero; // technically more of a "NA".
        }

        // 1) create a double with the bits.
        // Aline input to the top 53 bits then pre-append a "1" bit.
        // NOTE(review): the magnitude of val is used and the sign is not re-applied to the value
        // returned from this fast path - confirm callers only pass non-negative values.
        long inMantissa = (long)(BigInteger.Abs(val) << (53 - valSize));
        long dubAsLong = inMantissa | ((long)1023 << 52);
        double normInput = BitConverter.Int64BitsToDouble(dubAsLong);

        // 2) perform a power
        double normPow = double.Pow(normInput, exp);
        if (normPow == double.PositiveInfinity)
        {
            throw new OverflowException($"Internal Error: PositiveInfinity valSize:{valSize} exp:{exp} val:{val} wantedBits:{wantedBits}");
        }

        // 3) extract "bottom 52 bits" and that is our answer.
        long bits = BitConverter.DoubleToInt64Bits(normPow);
        long outMantissa = (bits & 0xfffffffffffffL) | 0x10000000000000L;

        int bitsToDrop = 53 - wantedBits;  // wantedBits OR size????
        long mask1 = ((long)1 << bitsToDrop) - 1;  // OR ((long)1 << (53 - size)) - 1  ?????

        // no known issues if val < 13511613 OR removed bits are not all 1's
        // NOTE(review): (outMantissa & mask1) is never negative, so its complement is always negative and
        // the first operand below is always false; in practice only 'val < 13511613' gates this path.
        if ((~(outMantissa & mask1)) >= 0 || val < 13511613)
        {
            int outExp = (int)(bits >> 52) - 1023;
            totalShift += ((valSize - 1) * (exp - 1)) + outExp + (valSize - wantedBits)  /*+ (1<<(expSz-2))*/;

            // outMantissa is 53 in size at this point
            // we need to Right Shift With Round but if it rounds up to a larger number (e.g. 1111->10000) then we must increment totalShift.
            bool roundsUp = ((outMantissa >> (bitsToDrop - 1)) & 0x1) > 0;
            if (!roundsUp)
            {
                return outMantissa >> bitsToDrop;
            }

            long withRoundUp = (outMantissa >> bitsToDrop) + 1;

            // if carried to the 54th place then it rolled over and we must shrink by one.
            if ((withRoundUp >> (53 - bitsToDrop)) > 0)
            {
                withRoundUp >>= 1;
                totalShift++;
            }

            return withRoundUp;
        }
    }

    // General path: square-and-multiply over the bits of exp, truncating intermediates to about workingSize bits.

    // First Loop (exponent bit 0)
    BigInteger product = ((exp & 1) > 0) ? val : 1;
    BigInteger powerPostShift = val;
    int shiftSum = 0;
    int shift = 0;

    // Second Loop (exponent bit 1)
    BigInteger pwrPreShift = powerPostShift * powerPostShift;
    int prdSize = (valSize * 2) - (((pwrPreShift >> ((valSize * 2) - 1)) > 0) ? 0 : 1);
    int H = valSize + prdSize;  //OR  size + shift
    int J = ((exp & 0x1) == 1) ? 0 : valSize;
    int I = 0;

    powerPostShift = pwrPreShift;
    if ((exp & 0x2) > 0)
    {
        I = H - workingSize;
        int shrinkSize = I - J;
        J = 0;
        product = (product * powerPostShift) >> shrinkSize;
        totalShift += shrinkSize;
    }
    else
    {
        J += prdSize;
    }

    // for each bit in the exponent, we need to multiply in 2^position
    for (int i = 2; i < expSz; i++)
    {
        pwrPreShift = powerPostShift * powerPostShift;

        // checks if a leading bit resulted from the multiply and if so adds it.
        int tmp = ((prdSize - shift) * 2) - 1;
        prdSize = tmp + (int)(pwrPreShift >> tmp);

        shift = Math.Max(prdSize - workingSize, 0);
        H += prdSize - shift - I;

        //powerPostShift = RightShiftWithRound(pwrPreShift, shift);  ///better precision by 1.7 buts but 25% slower
        powerPostShift = pwrPreShift >> shift; // 25% faster; 5 times more round errors; always one direction(good thing)

        shiftSum = (shiftSum * 2) + shift;
        bool bit = ((exp >> i) & 1) == 1;
        if (bit)
        {
            I = H - workingSize;
            int shrinkSize = I - J;
            J = 0;
            product = (product * powerPostShift) >> shrinkSize;
            totalShift += shrinkSize + shiftSum;
        }
        else
        {
            I = 0;
            J += prdSize - shift;  //OR  shift OR prdSize - shift
        }
    }

    // Trim the accumulated product down to the requested width, bumping totalShift if rounding carried.
    int productSize = (int)product.GetBitLength();
    int bitsToRemove = productSize - wantedBits;

    totalShift += bitsToRemove;

    bool carry = RightShiftWithRoundWithCarryDownsize(out BigInteger res, product, bitsToRemove, productSize);
    if (carry)
    {
        totalShift++;
    }

    return res;
}

/// <summary>
/// INCOMPLETE DRAFT of an n-th root. An initial estimate is produced with double-precision
/// <see cref="Math.Pow(double, double)"/>, then refined in a loop using updates of the form
/// x -= t / b, where t = x^root - value and b = root * x^(root-1). A BigFloat version and a
/// BigInteger version of the iteration are run side by side; only the BigFloat version's
/// result is returned.
/// </summary>
/// <param name="value">The value to take the root of.</param>
/// <param name="root">The root to take.</param>
/// <returns>The BigFloat iterate after the refinement loop (or an early result for a zero value or a root of 0 or 1).</returns>
public static BigFloat NthRoot_INCOMPLETE_DRAFT8(BigFloat value, int root)
{
    // Local switch for the diagnostic Console output below.
    bool DEBUG = false;
    //if (DEBUG) Console.WriteLine();

    // NOTE(review): rootIsNeg is only used to make root positive; no reciprocal is taken afterwards.
    bool rootIsNeg = root < 0;
    if (rootIsNeg)
    {
        root = -root;
    }

    // NOTE(review): resultIsPos is only applied in the 'root == 1' shortcut below, not to the final result.
    bool resultIsPos = value.DataBits.Sign > 0;
    if (!resultIsPos)
    {
        value = -value;
    }

    resultIsPos = resultIsPos || ((root & 1) == 0);

    // Check if Value is zero.
    if (value.DataBits.Sign == 0)
    {
        return BigFloat.ZeroWithSpecifiedLeastPrecision(value.Size);
    }

    // Check for common roots...
    switch (root)
    {
        case 0:
            return OneWithAccuracy(value.Size);
        case 1:
            return resultIsPos ? value : -value;
            //case 2:
            //    return resultIsPos ? Sqrt(value) : -Sqrt(value);
            //case 4:
            //    return resultIsPos ? Sqrt(Sqrt(value)) : -Sqrt(Sqrt(value));
    }

    //int xLen = value._size;
    int rootSize = BitOperations.Log2((uint)root);
    int wantedPrecision = (int)BigInteger.Log2(value.DataBits) + rootSize; // for better accuracy for small roots add: "+ rootSize / Math.Pow(( root >> (rootSize - 3)), root) - 0.5"

    //BigInteger val;
    ////////// Lets remove value's scale (and just leave the last bit so scale is 0 or 1) ////////
    int removedScale = value.Scale & ~1;
    int newScale = value.Scale - removedScale;

    ////////// Use double's hardware to get the first 53-bits ////////
    //long tempX = (long)(value._int >> (value._size - 52 /*- newScale*/ +22));
    ////////////////////////////////////////////////////////////////////////////
    // Top 53 bits of the magnitude with the leading bit toggled off, leaving the 52-bit fraction field.
    long mantissa = (long)(BigInteger.Abs(value.DataBits) >> (value._size - 53)) ^ ((long)1 << 52);
    long exp = value.Exponent + 1023 - 1;// + 52 -4;

    // if exp is oversized for double we need to pull out some exp:
    if (Math.Abs(value.Exponent) > 1021) // future: using 1021(not 1022) to be safe
    {
        // (The two lines below are reconstructed; part of the original comment was lost.)
        // old: (1)Pre: pre=(value<<(preShift*root)) (2)Root: result=pre^(1/root) (3)post: result/(1<<preShift)
        // new: (1)Pre: pre=(value>>preShift) (2)Root: result=pre^(1/root) (3)post: result/(2^(-preShift/root)

        //double finalDiv = Math.Pow(2,-value.Exponent/root);
        exp = 0;
    }

    double dubVal = BitConverter.Int64BitsToDouble(mantissa | (exp << 52));
    ///////////////////////////////////////////////////////////////////////////////////////////////

    // todo: what about just casting from BigFloat to double?
    //double test = Math.Log2(dubVal); //Math.Log2((double)tempX);
    double tempRoot = Math.Pow(dubVal, 1.0 / root);  //Math.Pow(tempX, 1.0/root)
    ulong bits = (ulong)BitConverter.DoubleToInt64Bits(tempRoot);
    ulong tempVal = (bits & 0x1fffffffffffffL) | (1UL << 52);
    int tempExp = (int)((bits >> 52) & 0x7ffL) - 1023 - 20;
    newScale += tempExp;

    // If 53 bits enough precision, lets use that and return.
    //if (value._size < 53)
    //{  // Shrink result to wanted Precision
    //    int shrinkAmt = (53 - value._size);
    //    BigFloat newVal = new BigFloat(tempVal >> shrinkAmt, newScale + shrinkAmt, value._size);
    //    return newVal;
    //}

    BigInteger xVal = tempVal;
    int x_Scale = newScale;
    //x_Scale -= 100; //TEMP
    //xVal <<= 100; //TEMP

    ////////////////// BigFloat Version ////////////////////////////
    BigFloat x = new((BigInteger)tempVal << 100, newScale - 100, true);
    //BigFloat rt = new((BigInteger)root << value.Size, -value.Size);  // get a proper sized "root" (only needed for BigFloat version)
    //BigFloat b = rt * Pow(x, root - 1); // Init the "b" and "t" for "oldX - (t / b)"
    //BigFloat t = Pow(x, root) - value;
    //while (t._size > 3) //(!t.OutOfPrecision)
    //{
    //    BigFloat oldX = x;
    //    BigFloat tb = t / b;
    //    x -= tb;
    //    if (DEBUG) Console.WriteLine($"{oldX} - ({t} / {b}) = {oldX} - {tb} =\r\n     {x}");
    //    b = rt * Pow(x, root - 1);
    //    t = Pow(x, root) - value;
    //}
    //BigFloat usingBigFloats = x;
    //new BigFloat(xVal, x_Scale, true);

    BigFloat rt = new((BigInteger)root << value.Size, -value.Size);  // get a proper sized "root" (only needed for BigFloat version)
    BigFloat t = Pow(x, root) - value;
    if (DEBUG) Console.WriteLine($"F-t:  {t.GetMostSignificantBits(196)}[{t._size}]");
    BigInteger biPower = PowMostSignificantBits(xVal << 53, root, out _);
    BigInteger t2 = (value.DataBits << (int)(biPower.GetBitLength() - value.DataBits.GetBitLength())) - biPower;
    if (DEBUG) Console.WriteLine($"I-t:  {BigIntegerToBinaryString(t2)}[{t2.GetBitLength()}]");
    BigFloat b = rt * Pow(x, root - 1);
    if (DEBUG) Console.WriteLine($"F-b:  {b.GetMostSignificantBits(196)}[{b._size}]");
    BigInteger b2;
    b2 = root * PowMostSignificantBits(xVal, root - 1, out _, 53, 26);
    if (DEBUG) Console.WriteLine($"I-b:  {BigIntegerToBinaryString(b2)}[{b2.GetBitLength()}]");
    // precision: biPower = 53, t2 = 53, b2 = 53, SO tb2 = 53 bits

    // Loop ends once the BigInteger iterate has reached 140 bits; it is widened by b2's bit length each pass.
    while (xVal.GetBitLength() < 140)//(t2.GetBitLength() > 20)//(t._size > 3) //(!t.OutOfPrecision)
    {
        if (DEBUG) Console.WriteLine();
        BigFloat oldX = x;
        BigInteger oldX2 = xVal;
        BigFloat tb = t / b;
        if (DEBUG) Console.WriteLine($"F-tb: {tb.GetMostSignificantBits(196)}[{tb._size}]");
        BigInteger tb2 = (t2 << 53) / b2;
        if (DEBUG) Console.WriteLine($"I-tb: {BigIntegerToBinaryString(tb2)}[{tb2.GetBitLength()}]");
        x -= tb;
        if (DEBUG) Console.WriteLine($"F-X: {x.GetMostSignificantBits(196)}[{x._size}]");
        xVal = (xVal << ((int)b2.GetBitLength())) + tb2;
        if (DEBUG) Console.WriteLine($"I-X: {BigIntegerToBinaryString(xVal)}[{xVal.GetBitLength()}]");
        if (DEBUG) Console.WriteLine($"Ans: 1100100001011001100000111.11011110011011111000001101101010110010111100111001011101100011110011111011010110111011101001110111110010111011100110101101111001011011000010111000110001001000000010100000110011111101101110011010000001...");
        //11001000010110011000001111101111001101111100000110110101011001011110011100100111000010100010010110001001000010011000000101000010101000000000011011011000010111100110010101111011001011011001110001110
        if (DEBUG) Console.WriteLine($"Ans: 1100100001011001100000111.11011110011011111000001101101010110010111100111001011101100011110011111011010110111011101001110111110010111011100110101101111001011011000010111000110001000110001111000010001011110100001011001101010000...");
        if (DEBUG) Console.WriteLine($"BF:{oldX} - ({t} / {b} [{tb}]) = {x}");
        //    1100100001011001100000111.11011110011011111000001101101010110010111100111001011101100011110011111010100000101100101000110010110110000100111101101111110111100001101101110111000000001110100100101011100100000100010101101110000111...
        //    1100100001011001100000111.11011110011011111000001101101010110010111100111001011101100011110011111010100000101100101000110010110110000100111101101111110111100001101101110111000000001110100100101011100100
        //    1100100001011001100000111.11011110011011111000001101101010110010111100111001011101100011110011111011010110111011101001110111110010111011100110101101111001011011000010111000110001001000000010100000110011111101101110011010000001...
        //Res: 1100100001011001100000111.1101111001101111100000110110101011001011110011100101110110001111001111101111001011
        if (DEBUG) Console.WriteLine($"BI:{oldX2} - ({t2} / {b2} [{tb2}]) = {new BigFloat(xVal, x_Scale - 54 - 32)}");

        biPower = PowMostSignificantBits(xVal /*<< 100*/, root, out _);
        if (DEBUG) Console.WriteLine($"F-pow:{Pow(x, root).GetMostSignificantBits(196)}[{Pow(x, root)._size}]");
        if (DEBUG) Console.WriteLine($"I-pow:{BigIntegerToBinaryString(biPower)}[{biPower.GetBitLength()}]");
        BigInteger val2 = value.DataBits << (int)(biPower.GetBitLength() - value.DataBits.GetBitLength());
        if (DEBUG) Console.WriteLine($"F-val:{value.GetMostSignificantBits(196)}[{t._size}]");
        if (DEBUG) Console.WriteLine($"I-val:{BigIntegerToBinaryString(val2)}[{val2.GetBitLength()}]");
        t = Pow(x, root) - value;
        if (DEBUG) Console.WriteLine($"F-t:  {t.GetMostSignificantBits(196)}[{t._size}]");
        t2 = biPower - val2;
        if (DEBUG) Console.WriteLine($"I-t:  {BigIntegerToBinaryString(t2)}[{t2.GetBitLength()}]");
        b = rt * Pow(x, root - 1);
        if (DEBUG) Console.WriteLine($"F-b:  {b.GetMostSignificantBits(196)}[{b._size}]");
        b2 = root * PowMostSignificantBits(xVal, root - 1, out _);
        if (DEBUG) Console.WriteLine($"I-b:  {BigIntegerToBinaryString(b2)}[{b2.GetBitLength()}]");
        // precision: t2 = 106, b2 = 106, SO tb2 = 106 bits
        // 'temp' is only consumed by the diagnostic output below.
        BigInteger temp = (t2 << ((2 * wantedPrecision) - (int)t2.GetBitLength())) / b2;
        if (DEBUG) Console.WriteLine($"I-tb: {BigIntegerToBinaryString(temp)}[{temp.GetBitLength()}]");
    }

    // The BigInteger-based result is constructed but discarded; the BigFloat iterate is what gets returned.
    _ = new BigFloat(xVal, x_Scale, true);
    return x;
}
/// <summary>
/// Debug-only sanity check for this instance: asserts that <c>_size</c> equals the bit length of the
/// absolute value of <c>DataBits</c>. Forwards to the static overload.
/// </summary>
[Conditional("DEBUG")]
private void AssertValid()
{
    AssertValid(this);
}

/// <summary>
/// Debug-only sanity check: asserts that <paramref name="val"/>'s <c>_size</c> equals the bit length of
/// the absolute value of its <c>DataBits</c>.
/// </summary>
/// <param name="val">The value to validate.</param>
[Conditional("DEBUG")]
private static void AssertValid(BigFloat val)
{
    // The size is measured on the magnitude, so the sign of DataBits does not affect the expected size.
    // NOTE(review): no special case is made for a zero DataBits - confirm whether zero should be exempt.
    BigInteger magnitude = BigInteger.Abs(val.DataBits);
    int expectedSize = (int)magnitude.GetBitLength();

    Debug.Assert(val._size == expectedSize, $"_size({val._size}), expected ({expectedSize})");
}
}