Skip to content

Commit 45ce75d

Browse files
committed
Optimized standard path calculation
1 parent 7b52a0a commit 45ce75d

File tree

3 files changed

+125
-41
lines changed

3 files changed

+125
-41
lines changed

ext/bcmath/libbcmath/src/div.c

Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -429,3 +429,27 @@ bool bc_divide(bc_num numerator, bc_num divisor, bc_num *quot, size_t scale)
429429
*quot = bc_copy_num(BCG(_zero_));
430430
return true;
431431
}
432+
433+
bool bc_divide_vector(
434+
BC_VECTOR *numerator_vectors, size_t numerator_arr_size,
435+
const BC_VECTOR *divisor_vectors, size_t divisor_arr_size,
436+
BC_VECTOR *quot_vectors, size_t quot_arr_size
437+
) {
438+
ZEND_ASSERT(divisor_vectors[divisor_arr_size - 1] != 0);
439+
ZEND_ASSERT(quot_arr_size == numerator_arr_size - divisor_arr_size + 1);
440+
441+
size_t divisor_size = (divisor_arr_size - 1) * BC_VECTOR_SIZE;
442+
BC_VECTOR tmp_divisor_top = divisor_vectors[divisor_arr_size - 1];
443+
while (tmp_divisor_top > 0) {
444+
divisor_size++;
445+
tmp_divisor_top /= BASE;
446+
}
447+
448+
/* Do the division */
449+
if (divisor_arr_size == 1) {
450+
bc_fast_div(numerator_vectors, numerator_arr_size, divisor_vectors[0], quot_vectors, quot_arr_size);
451+
} else {
452+
bc_standard_div(numerator_vectors, numerator_arr_size, divisor_vectors, divisor_arr_size, divisor_size, quot_vectors, quot_arr_size);
453+
}
454+
return true;
455+
}

ext/bcmath/libbcmath/src/private.h

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -87,6 +87,10 @@ bc_num _bc_do_sub (bc_num n1, bc_num n2);
8787
void bc_multiply_vector(
8888
const BC_VECTOR *n1_vector, size_t n1_arr_size, const BC_VECTOR *n2_vector, size_t n2_arr_size,
8989
BC_VECTOR *prod_vector, size_t prod_arr_size);
90+
bool bc_divide_vector(
91+
BC_VECTOR *numerator_vectors, size_t numerator_arr_size,
92+
const BC_VECTOR *divisor_vectors, size_t divisor_arr_size,
93+
BC_VECTOR *quot_vectors, size_t quot_arr_size);
9094
void _bc_rm_leading_zeros (bc_num num);
9195

9296
#endif

ext/bcmath/libbcmath/src/sqrt.c

Lines changed: 97 additions & 41 deletions
Original file line numberDiff line numberDiff line change
@@ -30,6 +30,7 @@
3030
*************************************************************************/
3131

3232
#include "bcmath.h"
33+
#include "convert.h"
3334
#include <stdbool.h>
3435
#include <stddef.h>
3536
#include "private.h"
@@ -111,55 +112,111 @@ static inline void bc_fast_sqrt(bc_num *num, size_t rscale)
111112
*num = ret;
112113
}
113114

114-
static inline void bc_standard_sqrt(bc_num *num, size_t rscale, bcmath_compare_result num_cmp_one)
115+
static inline void bc_standard_sqrt(bc_num *num, size_t rscale, size_t num_calc_full_len)
115116
{
116-
bc_num guess;
117-
size_t cscale;
118-
/* Calculate the initial guess. */
119-
if (num_cmp_one == BCMATH_RIGHT_GREATER) {
120-
/* The number is between 0 and 1. Guess should start at 1. */
121-
guess = bc_copy_num(BCG(_one_));
122-
cscale = (*num)->n_scale;
117+
/* allocate memory */
118+
size_t n_vector_size = BC_ARR_SIZE_FROM_LEN(num_calc_full_len);
119+
120+
size_t guess_len = ((*num)->n_len + 1) / 2;
121+
size_t guess_scale = rscale + 1;
122+
size_t guess_full_len = guess_len + guess_scale;
123+
/* The old guess and the new guess are added together during the calculation,
124+
* so the sum may carry into one more element; allocate one extra element for it. */
125+
size_t guess_vector_size = BC_ARR_SIZE_FROM_LEN(guess_full_len) + 1;
126+
127+
size_t allocate_size = n_vector_size * 2 + guess_vector_size * 3;
128+
BC_VECTOR *buf = safe_emalloc(allocate_size, sizeof(BC_VECTOR), 0);
129+
130+
BC_VECTOR *n_vector = buf;
131+
BC_VECTOR *n_vector_copy = n_vector + n_vector_size;
132+
BC_VECTOR *guess_vector = n_vector_copy + n_vector_size;
133+
BC_VECTOR *guess1_vector = guess_vector + guess_vector_size;
134+
BC_VECTOR *tmp_div_ret_vector = guess1_vector + guess_vector_size;
135+
136+
/* convert num to n_vector */
137+
size_t n_full_len = (*num)->n_len + (*num)->n_scale;
138+
const char *nend = (*num)->n_value + n_full_len - 1;
139+
size_t n_extend_zeros = num_calc_full_len - n_full_len;
140+
141+
bc_convert_to_vector_with_zero_pad(n_vector, nend, n_full_len, n_extend_zeros);
142+
143+
/* Prepare guess_vector (Temporary implementation) */
144+
for (size_t i = 0; i < guess_vector_size - 2; i++) {
145+
guess_vector[i] = BC_VECTOR_BOUNDARY_NUM - 1;
146+
}
147+
if (guess_full_len % BC_VECTOR_SIZE == 0) {
148+
guess_vector[guess_vector_size - 2] = BC_VECTOR_BOUNDARY_NUM - 1;
123149
} else {
124-
/* The number is greater than 1. Guess should start at 10^(exp/2). */
125-
/* Simply dividing a size_t by 2 cannot overflow. */
126-
size_t exponent_for_initial_guess = (size_t) (*num)->n_len >> 1;
127-
128-
/* 10^n is a 1 followed by n zeros. */
129-
guess = bc_new_num(exponent_for_initial_guess + 1, 0);
130-
guess->n_value[0] = 1;
131-
cscale = 3;
150+
guess_vector[guess_vector_size - 2] = 0;
151+
for (size_t i = 0; i < guess_full_len % BC_VECTOR_SIZE; i++) {
152+
guess_vector[guess_vector_size - 2] *= BASE;
153+
guess_vector[guess_vector_size - 2] += 9;
154+
}
132155
}
156+
guess_vector[guess_vector_size - 1] = 0;
157+
guess1_vector[guess_vector_size - 1] = 0;
158+
159+
size_t quot_size = n_vector_size - (guess_vector_size - 1) + 1;
133160

134-
bc_num guess1 = NULL;
135-
bc_num point5 = bc_new_num (1, 1);
136-
point5->n_value[1] = 5;
137-
bc_num diff = NULL;
161+
BC_VECTOR two[1] = { 2 };
138162

163+
/* Newton's algorithm. */
139164
bool done = false;
140-
while (!done) {
141-
bc_free_num (&guess1);
142-
guess1 = bc_copy_num(guess);
143-
bc_divide(*num, guess, &guess, cscale);
144-
bc_add_ex(guess, guess1, &guess, 0);
145-
bc_multiply_ex(guess, point5, &guess, cscale);
146-
bc_sub_ex(guess, guess1, &diff, cscale + 1);
147-
if (bc_is_near_zero(diff, cscale)) {
148-
if (cscale < rscale + 1) {
149-
cscale = MIN (cscale * 3, rscale + 1);
165+
do {
166+
for (size_t i = 0; i < n_vector_size; i++) {
167+
n_vector_copy[i] = n_vector[i];
168+
}
169+
bool div_ret = bc_divide_vector(n_vector_copy, n_vector_size, guess_vector, guess_vector_size - 1, tmp_div_ret_vector, quot_size);
170+
ZEND_ASSERT(div_ret);
171+
172+
BC_VECTOR *tmp_vptr = guess1_vector;
173+
guess1_vector = guess_vector;
174+
guess_vector = tmp_vptr;
175+
int carry = 0;
176+
for (size_t i = 0; i < guess_vector_size - 1; i++) {
177+
guess_vector[i] = guess1_vector[i] + tmp_div_ret_vector[i] + carry;
178+
if (guess_vector[i] >= BC_VECTOR_BOUNDARY_NUM) {
179+
guess_vector[i] -= BC_VECTOR_BOUNDARY_NUM;
180+
carry = 1;
150181
} else {
151-
done = true;
182+
carry = 0;
152183
}
153184
}
154-
}
185+
guess_vector[guess_vector_size - 1] = carry;
186+
187+
div_ret = bc_divide_vector(guess_vector, guess_vector_size, two, 1, tmp_div_ret_vector, guess_vector_size);
188+
ZEND_ASSERT(div_ret);
189+
190+
for (size_t i = 0; i < guess_vector_size; i++) {
191+
guess_vector[i] = tmp_div_ret_vector[i];
192+
}
155193

156-
/* Assign the number and clean up. */
157-
bc_free_num (num);
158-
bc_divide(guess, BCG(_one_), num, rscale);
159-
bc_free_num (&guess);
160-
bc_free_num (&guess1);
161-
bc_free_num (&point5);
162-
bc_free_num (&diff);
194+
size_t diff = guess_vector[0] > guess1_vector[0] ? guess_vector[0] - guess1_vector[0] : guess1_vector[0] - guess_vector[0];
195+
if (diff <= 1) {
196+
bool is_same = true;
197+
for (size_t i = 1; i < guess_vector_size - 1; i++) {
198+
if (guess_vector[i] != guess1_vector[i]) {
199+
is_same = false;
200+
break;
201+
}
202+
}
203+
done = is_same;
204+
}
205+
} while (!done);
206+
207+
bc_num ret = bc_new_num_nonzeroed(guess_len, guess_scale);
208+
char *rptr = ret->n_value;
209+
char *rend = rptr + guess_full_len - 1;
210+
211+
bc_convert_vector_to_char(guess_vector, rptr, rend, guess_vector_size - 1);
212+
213+
ret->n_scale = rscale;
214+
_bc_rm_leading_zeros(ret);
215+
216+
bc_free_num(num);
217+
*num = ret;
218+
219+
efree(buf);
163220
}
164221

165222
bool bc_sqrt(bc_num *num, size_t scale)
@@ -192,8 +249,7 @@ bool bc_sqrt(bc_num *num, size_t scale)
192249
if (num_calc_full_len < MAX_LENGTH_OF_LONG) {
193250
bc_fast_sqrt(num, rscale);
194251
} else {
195-
bc_standard_sqrt(num, rscale, num_cmp_one);
252+
bc_standard_sqrt(num, rscale, num_calc_full_len);
196253
}
197-
198254
return true;
199255
}

0 commit comments

Comments
 (0)