|
30 | 30 | *************************************************************************/
|
31 | 31 |
|
32 | 32 | #include "bcmath.h"
|
| 33 | +#include "convert.h" |
33 | 34 | #include <stdbool.h>
|
34 | 35 | #include <stddef.h>
|
35 | 36 | #include "private.h"
|
@@ -140,53 +141,107 @@ bool bc_sqrt(bc_num *num, size_t scale)
|
140 | 141 | } else {
|
141 | 142 | /* Standard path */
|
142 | 143 |
|
143 |
| - bc_num guess; |
144 |
| - size_t cscale; |
145 |
| - /* Calculate the initial guess. */ |
146 |
| - if (num_cmp_one == BCMATH_RIGHT_GREATER) { |
147 |
| - /* The number is between 0 and 1. Guess should start at 1. */ |
148 |
| - guess = bc_copy_num(BCG(_one_)); |
149 |
| - cscale = (*num)->n_scale; |
| 144 | + /* allocate memory */ |
| 145 | + size_t n_vector_size = BC_ARR_SIZE_FROM_LEN(num_calc_full_len); |
| 146 | + |
| 147 | + size_t guess_len = ((*num)->n_len + 1) / 2; |
| 148 | + size_t guess_scale = rscale + 1; |
| 149 | + size_t guess_full_len = guess_len + guess_scale; |
| 150 | + size_t guess_vector_size = BC_ARR_SIZE_FROM_LEN(guess_full_len) + 1; |
| 151 | + |
| 152 | + size_t allocate_size = n_vector_size * 2 + guess_vector_size * 3; |
| 153 | + BC_VECTOR *buf = safe_emalloc(allocate_size, sizeof(BC_VECTOR), 0); |
| 154 | + |
| 155 | + BC_VECTOR *n_vector = buf; |
| 156 | + BC_VECTOR *n_vector_copy = n_vector + n_vector_size; |
| 157 | + BC_VECTOR *guess_vector = n_vector_copy + n_vector_size; |
| 158 | + BC_VECTOR *guess1_vector = guess_vector + guess_vector_size; |
| 159 | + BC_VECTOR *tmp_div_ret_vector = guess1_vector + guess_vector_size; |
| 160 | + |
| 161 | + /* convert num to n_vector */ |
| 162 | + size_t n_full_len = (*num)->n_len + (*num)->n_scale; |
| 163 | + const char *nend = (*num)->n_value + n_full_len - 1; |
| 164 | + size_t n_extend_zeros = num_calc_full_len - n_full_len; |
| 165 | + |
| 166 | + bc_convert_to_vector_with_zero_pad(n_vector, nend, n_full_len, n_extend_zeros); |
| 167 | + |
| 168 | + /* Prepare guess_vector */ |
| 169 | + for (size_t i = 0; i < guess_vector_size - 2; i++) { |
| 170 | + guess_vector[i] = BC_VECTOR_BOUNDARY_NUM - 1; |
| 171 | + } |
| 172 | + if (guess_full_len % BC_VECTOR_SIZE == 0) { |
| 173 | + guess_vector[guess_vector_size - 2] = BC_VECTOR_BOUNDARY_NUM - 1; |
150 | 174 | } else {
|
151 |
| - /* The number is greater than 1. Guess should start at 10^(exp/2). */ |
152 |
| - /* If just divide size_t by 2 it will not overflow. */ |
153 |
| - size_t exponent_for_initial_guess = (size_t) (*num)->n_len >> 1; |
154 |
| - |
155 |
| - /* 10^n is a 1 followed by n zeros. */ |
156 |
| - guess = bc_new_num(exponent_for_initial_guess + 1, 0); |
157 |
| - guess->n_value[0] = 1; |
158 |
| - cscale = 3; |
| 175 | + guess_vector[guess_vector_size - 2] = 0; |
| 176 | + for (size_t i = 0; i < guess_full_len % BC_VECTOR_SIZE; i++) { |
| 177 | + guess_vector[guess_vector_size - 2] *= BASE; |
| 178 | + guess_vector[guess_vector_size - 2] += 9; |
| 179 | + } |
159 | 180 | }
|
| 181 | + guess_vector[guess_vector_size - 1] = 0; |
| 182 | + guess1_vector[guess_vector_size - 1] = 0; |
| 183 | + |
| 184 | + size_t quot_size = n_vector_size - (guess_vector_size - 1) + 1; |
160 | 185 |
|
161 |
| - bc_num guess1 = NULL; |
162 |
| - bc_num point5 = bc_new_num (1, 1); |
163 |
| - point5->n_value[1] = 5; |
164 |
| - bc_num diff = NULL; |
| 186 | + BC_VECTOR two[1] = { 2 }; |
165 | 187 |
|
| 188 | + /* Newton's algorithm. */ |
166 | 189 | bool done = false;
|
167 |
| - while (!done) { |
168 |
| - bc_free_num (&guess1); |
169 |
| - guess1 = bc_copy_num(guess); |
170 |
| - bc_divide(*num, guess, &guess, cscale); |
171 |
| - bc_add_ex(guess, guess1, &guess, 0); |
172 |
| - bc_multiply_ex(guess, point5, &guess, cscale); |
173 |
| - bc_sub_ex(guess, guess1, &diff, cscale + 1); |
174 |
| - if (bc_is_near_zero(diff, cscale)) { |
175 |
| - if (cscale < rscale + 1) { |
176 |
| - cscale = MIN (cscale * 3, rscale + 1); |
| 190 | + do { |
| 191 | + for (size_t i = 0; i < n_vector_size; i++) { |
| 192 | + n_vector_copy[i] = n_vector[i]; |
| 193 | + } |
| 194 | + bool div_ret = bc_divide_vector(n_vector_copy, n_vector_size, guess_vector, guess_vector_size - 1, tmp_div_ret_vector, quot_size); |
| 195 | + ZEND_ASSERT(div_ret); |
| 196 | + |
| 197 | + BC_VECTOR *tmp_vptr = guess1_vector; |
| 198 | + guess1_vector = guess_vector; |
| 199 | + guess_vector = tmp_vptr; |
| 200 | + int carry = 0; |
| 201 | + for (size_t i = 0; i < guess_vector_size - 1; i++) { |
| 202 | + guess_vector[i] = guess1_vector[i] + tmp_div_ret_vector[i] + carry; |
| 203 | + if (guess_vector[i] >= BC_VECTOR_BOUNDARY_NUM) { |
| 204 | + guess_vector[i] -= BC_VECTOR_BOUNDARY_NUM; |
| 205 | + carry = 1; |
177 | 206 | } else {
|
178 |
| - done = true; |
| 207 | + carry = 0; |
179 | 208 | }
|
180 | 209 | }
|
181 |
| - } |
| 210 | + guess_vector[guess_vector_size - 1] = carry; |
182 | 211 |
|
183 |
| - /* Assign the number and clean up. */ |
184 |
| - bc_free_num (num); |
185 |
| - bc_divide(guess, BCG(_one_), num, rscale); |
186 |
| - bc_free_num (&guess); |
187 |
| - bc_free_num (&guess1); |
188 |
| - bc_free_num (&point5); |
189 |
| - bc_free_num (&diff); |
| 212 | + div_ret = bc_divide_vector(guess_vector, guess_vector_size, two, 1, tmp_div_ret_vector, guess_vector_size); |
| 213 | + ZEND_ASSERT(div_ret); |
| 214 | + |
| 215 | + for (size_t i = 0; i < guess_vector_size; i++) { |
| 216 | + guess_vector[i] = tmp_div_ret_vector[i]; |
| 217 | + } |
| 218 | + |
| 219 | + size_t diff = guess_vector[0] > guess1_vector[0] ? guess_vector[0] - guess1_vector[0] : guess1_vector[0] - guess_vector[0]; |
| 220 | + if (diff <= 1) { |
| 221 | + bool is_same = true; |
| 222 | + for (size_t i = 1; i < guess_vector_size - 1; i++) { |
| 223 | + if (guess_vector[i] != guess1_vector[i]) { |
| 224 | + is_same = false; |
| 225 | + break; |
| 226 | + } |
| 227 | + } |
| 228 | + done = is_same; |
| 229 | + } |
| 230 | + } while (!done); |
| 231 | + |
| 232 | + bc_num ret = bc_new_num_nonzeroed(guess_len, guess_scale); |
| 233 | + char *rptr = ret->n_value; |
| 234 | + char *rend = rptr + guess_full_len - 1; |
| 235 | + |
| 236 | + bc_convert_vector_to_char(guess_vector, rptr, rend, guess_vector_size - 1); |
| 237 | + |
| 238 | + ret->n_scale = rscale; |
| 239 | + _bc_rm_leading_zeros(ret); |
| 240 | + |
| 241 | + bc_free_num(num); |
| 242 | + *num = ret; |
| 243 | + |
| 244 | + efree(buf); |
190 | 245 | }
|
191 | 246 |
|
192 | 247 | return true;
|
|
0 commit comments