#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <math.h>
const uint32_t RADIX = 10000;
const double pi = 3.1415926535897932385;
double cos1;
double sin1;
void fr(double *s1,double *s2,double *end,size_t add,size_t t90){
for(;s1<end;s1+=add,s2+=add){
double r0,r1,r2,r3,m0,m1;
r0=s1[0];
r1=s2[0];
r2=s1[t90];
r3=s2[t90];
m0=r2*cos1-r3*sin1;
m1=r2*sin1+r3*cos1;
s1[0] = r0+m0;
s2[0] = r0-m0;
s1[t90] =-r1+m1;
s2[t90] = r1+m1;
}
}
void fri(double *s1,double *s2,double *end,size_t add,size_t t90){
for(;s1<end;s1+=add,s2+=add){
double r0,r1,r2,r3,m0,m1,m2,m3;
r0=s1[0];
r1=s2[0];
r2=s1[t90];
r3=s2[t90];
m0= r0+r1;
m1=-r2+r3;
m2= r0-r1;
m3= r2+r3;
s1[0] = m0;
s2[0] = m1;
s1[t90] = m2*cos1+m3*sin1;
s2[t90] =-m2*sin1+m3*cos1;
}
}
void fr0(double *s1,double *end,size_t add,size_t t90){
for(;s1<end;s1+=add){
double r0,r1;
r0=s1[0];
r1=s1[t90];
s1[0] =r0+r1;
s1[t90] =r0-r1;
}
}
void swap_d(double *a, double *b) {
double t = *a;
*a = *b;
*b = t;
}
void bxchg(double *s,int p){
size_t t4, t5, t6;
size_t t045, t090, t180, t270;
t045 = (size_t)1<<p-3;
t090 = t045 + t045;
t180 = t090 + t090;
t270 = t180 + t090;
t4 = t090 - 4;
t5 = t4;
do {
swap_d(&s[t4+1], &s[t180+t5]);
swap_d(&s[t4+2], &s[t090+t5]);
swap_d(&s[t4+3], &s[t270+t5]);
swap_d(&s[t090+t4+1], &s[t180+t5+2]);
swap_d(&s[t090+t4+3], &s[t270+t5+2]);
swap_d(&s[t180+t4+3], &s[t270+t5+1]);
if(t4 < t5){
swap_d(&s[t4], &s[t5]);
swap_d(&s[t090+t4+2], &s[t090+t5+2]);
swap_d(&s[t180+t4+1], &s[t180+t5+1]);
swap_d(&s[t270+t4+3], &s[t270+t5+3]);
}
if (t4 == 0){
break;
}
t4 -= 4;
t6 = t045;
for(;;){
t5 ^= t6;
if((t5 & t6) == 0){
break;
}
t6 >>= 1;
}
} while (1);
}
void bitexchg(double *s,int p){
if (p <= 1){
}
else if (p == 2){
swap_d(&s[1],&s[2]);
}
else if (p == 3){
swap_d(&s[1],&s[4]);
swap_d(&s[3],&s[6]);
}
else {
bxchg(s,p);
}
}
double* SIN_TABLE[64] = {0};
const double* sin_table(int p){
if (p >= 2 && SIN_TABLE[p] == 0){
size_t t090 = (size_t)1<<p-2;
SIN_TABLE[p] = (double*)malloc(t090*sizeof(double));
double k = 0.5 * pi / t090;
for (int i = 0 ; i < t090 ; i++){
SIN_TABLE[p][i] = sin(k * i);
}
}
return SIN_TABLE[p];
}
void fouri(double *s, int p){
const double* table = sin_table(p);
bitexchg(s,p);
size_t q = (size_t)1<<p;
for (int i = 1;i <= p; i++){
size_t r360 = (size_t)1<<i;
size_t r180 = r360 / 2;
size_t r090 = r180 / 2;
size_t k1 = 0;
size_t k2 = r180 - 1;
fr0(&s[0], &s[q], r360, r180);
k1 ++;
size_t t0 = (size_t)1<<p-i;
size_t t1 = ((size_t)1<<p-2) - t0;
size_t t2 = (size_t)1<<p-i;
for (;k1 < r090;k1 ++,k2 --){
sin1 = table[t0];
cos1 = table[t1];
fr(&s[k1], &s[k2], &s[q], r360, r180);
t0 += t2;
t1 -= t2;
}
}
}
void fouriinv(double *s, int p){
const double* table = sin_table(p);
size_t q = (size_t)1<<p;
for (int i = p;i >= 1; i--){
size_t r360 = (size_t)1<<i;
size_t r180 = r360 / 2;
size_t r090 = r180 / 2;
size_t k1 = 0;
size_t k2 = r180 - 1;
fr0(&s[0], &s[q], r360, r180);
k1 ++;
size_t t0 = (size_t)1<<p-i;
size_t t1 = ((size_t)1<<p-2) - t0;
size_t t2 = (size_t)1<<p-i;
for (;k1 < r090;k1 ++,k2 --){
sin1 = table[t0];
cos1 = table[t1];
fri(&s[k1], &s[k2], &s[q], r360, r180);
t0 += t2;
t1 -= t2;
}
}
bitexchg(s,p);
}
int s2p(uint64_t s) {
int i;
for (i = 0; i < 64; i++) {
if ((size_t)1 << i >= s) {
break;
}
}
return i;
}
typedef struct I_ {
uint16_t *data;
size_t capacity;
size_t size;
} I;
typedef struct F_ {
double *data;
size_t capacity;
int p;
} F;
void alloc_i(I *a, size_t cap){
a->data = (uint16_t*)malloc(cap * sizeof(uint16_t));
a->capacity = cap;
}
void free_i(I *a) {
free(a->data);
}
void alloc_f(F *a, int p) {
size_t cap = (size_t)1 << p;
a->data = (double*)malloc(cap * sizeof(double));
a->capacity = cap;
}
void free_f(F *a){
free(a->data);
}
void swap_i(I *a, I *b) {
I t = *a;
*a = *b;
*b = t;
}
void i2f(F *a, const I *b, int p){
size_t i;
size_t t360 = (size_t)1 << p;
a->p = p;
int carry = 0;
for (i = 0; i < b->size -1; i++){
int t = b->data[i] + carry;
if (t < (int)RADIX/2){
a->data[i] = t;
carry = 0;
}
else {
a->data[i] = (int)t - (int)RADIX;
carry = 1;
}
}
a->data[i++] = b->data[i] + carry;
for (; i < t360; i++) {
a->data[i] = 0.;
}
fouri(a->data, p);
}
void mul_f2i(I *a, const F *b, const F *c, F *d){
int p = b->p;
size_t t180 = (size_t)1 << p-1;
size_t t360 = t180 + t180;
size_t i;
int64_t carry;
size_t t;
size_t s;
d->data[0] = b->data[0] * c->data[0] * .5;
d->data[t180] = b->data[t180] * c->data[t180] * .5;
{
size_t k1 = 1;
size_t k2 = ((size_t)1<<p)-1;
size_t end = t180;
for (; k1 < end ; k1++,k2--){
double re = b->data[k1] * c->data[k1] - b->data[k2] * c->data[k2];
double im = b->data[k1] * c->data[k2] + b->data[k2] * c->data[k1];
d->data[k1] = re;
d->data[k2] = im;
}
}
fouriinv(d->data, p);
s = a->capacity < t360 ? a->capacity : t360;
carry = 0;
t = 1;
double k = ldexp(1., -p+1);
for (i = 0 ; i < s ; i++){
int64_t e = (int64_t)floor(d->data[i] * k + .5) + carry;
int16_t f;
carry = e / RADIX;
f = (int16_t)(e - carry * RADIX);
if (f < 0){
f += RADIX;
carry --;
}
a->data[i] = f;
if (f != 0) {
t = i + 1;
}
}
a->size = t;
}
void add_i(I *a, const I *b, const I *c) {
uint16_t carry = 0;
size_t i;
if (b->size > c->size){
const I *t = b;
b = c;
c = t;
}
for (i = 0; i < b->size; i++) {
uint16_t d = b->data[i] + c->data[i] + carry;
carry = 0;
if (d >= RADIX){
d -= RADIX;
carry ++;
}
a->data[i] = d;
}
for (; i < c->size; i++) {
uint16_t d = c->data[i] + carry;
carry = 0;
if (d >= RADIX){
d -= RADIX;
carry ++;
}
a->data[i] = d;
}
a->size = c->size;
if (carry != 0){
a->data[a->size++] = carry;
}
}
void print(const I *a){
size_t s = a->size;
printf("%u", a->data[--s]);
while (s != 0) {
printf("%04u", a->data[--s]);
}
}
void f(uint64_t n){
I a, b, c;
F x, y, z;
int i, p;
{
size_t cap = (size_t)floor((log(sqrt(1.25) + .5)*n - 0.5*log(5.)) * (1. / log((double)RADIX)) + 2.001);
if (cap <= 2) {
cap = 2;
}
p = s2p(cap);
alloc_i(&a, cap);
alloc_i(&b, cap);
alloc_i(&c, cap);
alloc_f(&x, p);
alloc_f(&y, p);
alloc_f(&z, p);
a.data[0] = 1;
a.size = 1;
b.data[0] = 0;
b.size = 1;
}
for (i = 63; i > 0; i--) {
p = s2p(b.size + b.size);
i2f(&x, &a, p);
i2f(&y, &b, p);
mul_f2i(&c, &y, &y, &z);
mul_f2i(&a, &x, &x, &z);
add_i(&a, &a, &c);
mul_f2i(&b, &x, &y, &z);
add_i(&b, &b, &b);
add_i(&b, &b, &c);
if (n+1 & (size_t)1 << i) {
add_i(&a, &a, &b);
swap_i(&a, &b);
}
}
if (n+1 & 1) {
add_i(&a, &a, &a);
add_i(&a, &a, &b);
p = s2p(a.size + b.size);
i2f(&x, &a, p);
i2f(&y, &b, p);
mul_f2i(&a, &x, &y, &z);
}
else {
p = s2p(a.size + a.size);
i2f(&x, &a, p);
mul_f2i(&a, &x, &x, &z);
p = s2p(b.size + b.size);
i2f(&y, &b, p);
mul_f2i(&b, &y, &y, &z);
add_i(&a, &a, &b);
}
printf("F(%llu) = ", n);
print(&a);
printf("\r\n");
free_i(&a);
free_i(&b);
free_i(&c);
free_f(&x);
free_f(&y);
free_f(&z);
}
int main(){
f(1000000000);
return 0;
}
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <math.h>

const uint32_t RADIX = 10000;
const double pi = 3.1415926535897932385;

double cos1;
double sin1;

void fr(double *s1,double *s2,double *end,size_t add,size_t t90){
	for(;s1<end;s1+=add,s2+=add){
		double r0,r1,r2,r3,m0,m1;

		r0=s1[0];
		r1=s2[0];
		r2=s1[t90];
		r3=s2[t90];

		m0=r2*cos1-r3*sin1;
		m1=r2*sin1+r3*cos1;

		s1[0]   = r0+m0;
		s2[0]   = r0-m0;
		s1[t90] =-r1+m1;
		s2[t90] = r1+m1;
	}
}

void fri(double *s1,double *s2,double *end,size_t add,size_t t90){
	for(;s1<end;s1+=add,s2+=add){
		double r0,r1,r2,r3,m0,m1,m2,m3;

		r0=s1[0];
		r1=s2[0];
		r2=s1[t90];
		r3=s2[t90];

		m0= r0+r1;
		m1=-r2+r3;
		m2= r0-r1;
		m3= r2+r3;

		s1[0]   = m0;
		s2[0]   = m1;
		s1[t90] = m2*cos1+m3*sin1;
		s2[t90] =-m2*sin1+m3*cos1;
	}
}

void fr0(double *s1,double *end,size_t add,size_t t90){
	for(;s1<end;s1+=add){
		double r0,r1;

		r0=s1[0];
		r1=s1[t90];

		s1[0] =r0+r1;
		s1[t90] =r0-r1;
	}
}

void swap_d(double *a, double *b) {
	double t = *a;
	*a = *b;
	*b = t;
}

void bxchg(double *s,int p){
	size_t t4, t5, t6;
	size_t t045, t090, t180, t270;

	t045 = (size_t)1<<p-3;
	t090 = t045 + t045;
	t180 = t090 + t090;
	t270 = t180 + t090;

	t4 = t090 - 4;
	t5 = t4;
	do {
		swap_d(&s[t4+1], &s[t180+t5]);
		swap_d(&s[t4+2], &s[t090+t5]);
		swap_d(&s[t4+3], &s[t270+t5]);
		swap_d(&s[t090+t4+1], &s[t180+t5+2]);
		swap_d(&s[t090+t4+3], &s[t270+t5+2]);
		swap_d(&s[t180+t4+3], &s[t270+t5+1]);

		if(t4 < t5){
			swap_d(&s[t4], &s[t5]);
			swap_d(&s[t090+t4+2], &s[t090+t5+2]);
			swap_d(&s[t180+t4+1], &s[t180+t5+1]);
			swap_d(&s[t270+t4+3], &s[t270+t5+3]);
		}
		if (t4 == 0){
			break;
		}

		t4 -= 4;
		t6 = t045;
		for(;;){
			t5 ^= t6;
			if((t5 & t6) == 0){
				break;
			}
			t6 >>= 1;
		}
	} while (1);
}

void bitexchg(double *s,int p){
	if (p <= 1){
	}
	else if (p == 2){
		swap_d(&s[1],&s[2]);
	}
	else if (p == 3){
		swap_d(&s[1],&s[4]);
		swap_d(&s[3],&s[6]);
	}
	else {
		bxchg(s,p);
	}
}

double* SIN_TABLE[64] = {0};

const double* sin_table(int p){
	if (p >= 2 && SIN_TABLE[p] == 0){
		size_t t090 = (size_t)1<<p-2;
		SIN_TABLE[p] = (double*)malloc(t090*sizeof(double));
		double k = 0.5 * pi / t090;
		for (int i = 0 ; i < t090 ; i++){
			SIN_TABLE[p][i] = sin(k * i);
		}
	}
	return SIN_TABLE[p];
}

void fouri(double *s, int p){
	const double* table = sin_table(p);

	bitexchg(s,p);

	size_t q = (size_t)1<<p;

	for (int i = 1;i <= p; i++){
		size_t r360 = (size_t)1<<i;
		size_t r180 = r360 / 2;
		size_t r090 = r180 / 2;
		size_t k1 = 0;
		size_t k2 = r180 - 1;

		fr0(&s[0], &s[q], r360, r180);
		k1 ++;

		size_t t0 = (size_t)1<<p-i;
		size_t t1 = ((size_t)1<<p-2) - t0;
		size_t t2 = (size_t)1<<p-i;
		for (;k1 < r090;k1 ++,k2 --){
			sin1 = table[t0];
			cos1 = table[t1];
			fr(&s[k1], &s[k2], &s[q], r360, r180);
			t0 += t2;
			t1 -= t2;
		}
	}
}

void fouriinv(double *s, int p){
	const double* table = sin_table(p);

	size_t q = (size_t)1<<p;

	for (int i = p;i >= 1; i--){
		size_t r360 = (size_t)1<<i;
		size_t r180 = r360 / 2;
		size_t r090 = r180 / 2;
		size_t k1 = 0;
		size_t k2 = r180 - 1;

		fr0(&s[0], &s[q], r360, r180);
		k1 ++;

		size_t t0 = (size_t)1<<p-i;
		size_t t1 = ((size_t)1<<p-2) - t0;
		size_t t2 = (size_t)1<<p-i;
		for (;k1 < r090;k1 ++,k2 --){
			sin1 = table[t0];
			cos1 = table[t1];
			fri(&s[k1], &s[k2], &s[q], r360, r180);
			t0 += t2;
			t1 -= t2;
		}
	}
	bitexchg(s,p);
}

int s2p(uint64_t s) {
	int i;
	for (i = 0; i < 64; i++) {
		if ((size_t)1 << i >= s) {
			break;
		}
	}
	return i;
}

typedef struct I_ {
	uint16_t *data;
	size_t capacity;
	size_t size;
} I;

typedef struct F_ {
	double *data;
	size_t capacity;
	int p;
} F;

void alloc_i(I *a, size_t cap){
	a->data = (uint16_t*)malloc(cap * sizeof(uint16_t));
	a->capacity = cap;
}

void free_i(I *a) {
	free(a->data);
}

void alloc_f(F *a, int p) {
	size_t cap = (size_t)1 << p;
	a->data = (double*)malloc(cap * sizeof(double));
	a->capacity = cap;
}

void free_f(F *a){
	free(a->data);
}

void swap_i(I *a, I *b) {
	I t = *a;
	*a = *b;
	*b = t;
}

void i2f(F *a, const I *b, int p){
	size_t i;
	size_t t360 = (size_t)1 << p;

	a->p = p;

	int carry = 0;
	for (i = 0; i < b->size -1; i++){
		int t = b->data[i] + carry;
		if (t < (int)RADIX/2){
			a->data[i] = t;
			carry = 0;
		}
		else {
			a->data[i] = (int)t - (int)RADIX;
			carry = 1;
		}
	}
	a->data[i++] = b->data[i] + carry;
	for (; i < t360; i++) {
		a->data[i] = 0.;
	}
	fouri(a->data, p);
}

void mul_f2i(I *a, const F *b, const F *c, F *d){
	int p = b->p;
	size_t t180 = (size_t)1 << p-1;
	size_t t360 = t180 + t180;
	size_t i;
	int64_t carry;
	size_t t;
	size_t s;

	d->data[0] = b->data[0] * c->data[0] * .5;
	d->data[t180] = b->data[t180] * c->data[t180] * .5;
	{
		size_t k1 = 1;
		size_t k2 = ((size_t)1<<p)-1;
		size_t end = t180;
		for (; k1 < end ; k1++,k2--){
			double re = b->data[k1] * c->data[k1] - b->data[k2] * c->data[k2];
			double im = b->data[k1] * c->data[k2] + b->data[k2] * c->data[k1];
			d->data[k1] = re;
			d->data[k2] = im;
		}
	}

	fouriinv(d->data, p);

	s = a->capacity < t360 ? a->capacity : t360;

	carry = 0;
	t = 1;
	double k = ldexp(1., -p+1);
	for (i = 0 ; i < s ; i++){
		int64_t e = (int64_t)floor(d->data[i] * k + .5) + carry;
		int16_t f;
		carry = e / RADIX;
		f = (int16_t)(e - carry * RADIX);
		if (f < 0){
			f += RADIX;
			carry --;
		}
		a->data[i] = f;
		if (f != 0) {
			t = i + 1;
		}
	}
	a->size = t;
}

void add_i(I *a, const I *b, const I *c) {
	uint16_t carry = 0;
	size_t i;
	if (b->size > c->size){
		const I *t = b;
		b = c;
		c = t;
	}

	for (i = 0; i < b->size; i++) {
		uint16_t d = b->data[i] + c->data[i] + carry;
		carry = 0;
		if (d >= RADIX){
			d -= RADIX;
			carry ++;
		}
		a->data[i] = d;
	}
	for (; i < c->size; i++) {
		uint16_t d = c->data[i] + carry;
		carry = 0;
		if (d >= RADIX){
			d -= RADIX;
			carry ++;
		}
		a->data[i] = d;
	}
	a->size = c->size;
	if (carry != 0){
		a->data[a->size++] = carry;
	}
}

void print(const I *a){
	size_t s = a->size;
	printf("%u", a->data[--s]);
	while (s != 0) {
		printf("%04u", a->data[--s]);
	}
}

void f(uint64_t n){
	I a, b, c;
	F x, y, z;
	int i, p;

	{
		size_t cap = (size_t)floor((log(sqrt(1.25) + .5)*n - 0.5*log(5.)) * (1. / log((double)RADIX)) + 2.001);
		if (cap <= 2) {
			cap = 2;
		}
		p = s2p(cap);
		alloc_i(&a, cap);
		alloc_i(&b, cap);
		alloc_i(&c, cap);
		alloc_f(&x, p);
		alloc_f(&y, p);
		alloc_f(&z, p);
		a.data[0] = 1;
		a.size = 1;
		b.data[0] = 0;
		b.size = 1;
	}

	for (i = 63; i > 0; i--) {
		p = s2p(b.size + b.size);
		i2f(&x, &a, p);
		i2f(&y, &b, p);
		mul_f2i(&c, &y, &y, &z);
		mul_f2i(&a, &x, &x, &z);
		add_i(&a, &a, &c);
		mul_f2i(&b, &x, &y, &z);
		add_i(&b, &b, &b);
		add_i(&b, &b, &c);
		if (n+1 & (size_t)1 << i) {
			add_i(&a, &a, &b);
			swap_i(&a, &b);
		}
	}
	if (n+1 & 1) {
		add_i(&a, &a, &a);
		add_i(&a, &a, &b);
		p = s2p(a.size + b.size);
		i2f(&x, &a, p);
		i2f(&y, &b, p);
		mul_f2i(&a, &x, &y, &z);
	}
	else {
		p = s2p(a.size + a.size);
		i2f(&x, &a, p);
		mul_f2i(&a, &x, &x, &z);
		p = s2p(b.size + b.size);
		i2f(&y, &b, p);
		mul_f2i(&b, &y, &y, &z);
		add_i(&a, &a, &b);
	}

	printf("F(%llu) = ", n);
	print(&a);
	printf("\r\n");

	free_i(&a);
	free_i(&b);
	free_i(&c);
	free_f(&x);
	free_f(&y);
	free_f(&z);
}

int main(){
	f(1000000000);
	return 0;
}
