提交记录 5178


用户 题目 状态 得分 用时 内存 语言 代码长度
f321dd 1002i. 【模板题】多项式乘法 Accepted 100 15.124 ms 10660 KB C++ 2.21 KB
提交时间 评测时间
2018-08-10 13:45:26 2020-08-01 00:13:37
#pragma GCC target("sse2")
#pragma GCC optimize("Ofast,no-stack-protector,unroll-loops,fast-math")
#include<algorithm>
#include<cstdio>
#include<cmath>
#include<immintrin.h>
#define get(a,i)((double*)&a)[i]
typedef unsigned u32;
struct ano{
	char a[1<<20],b[1<<21];
	char*s,*t;
	ano():s(a),t(b){
		fread(a,1,sizeof a,stdin);
	}
	~ano(){fwrite(b,1,t-b,stdout);}
	operator u32(){
		u32 x=0;
		while(*s<48)++s;
		while(*s>32)
			x=x*10+*s++-48;
		return x;
	}
	void out(u32 x){
		static char c[12];
		char*i=c;
		if(!x)*t++=48;
		else{
			while(x){
				u32 y=x/10;
				*i++=x-y*10+48,x=y;
			}
			while(i!=c)*t++=*--i;
		}
		*t++=32;
	}
}buf;
typedef __m128d vec;
inline vec mul(vec a,vec b){
	vec u=_mm_mul_pd(a,b);
	vec v=_mm_mul_pd(a,_mm_loadr_pd((double*)&b));
	return _mm_setr_pd(get(u,0)-get(u,1),get(v,0)+get(v,1));
}
using namespace std;
const u32 N=1<<17;
const double pi=acos(-1.);
inline vec conj(vec a){
	return _mm_setr_pd(get(a,0),-get(a,1));
}
vec w[N/2],a[N],b[N],c[N];
void fft(vec*a,u32 n){
	for(u32 i=0,j=0;i<n;++i){
		if(i<j)
			swap(a[i],a[j]);
		for(u32 k=n>>1;;k>>=1)
			if((j^=k)>=k)break;
	}
	w[0]=_mm_set_sd(1);
	for(u32 i=1;i<n;i<<=1){
		vec s=_mm_setr_pd(cos(pi/i),sin(pi/i));
		for(int j=i-2;j>0;j-=2)
			w[j]=w[j>>1];
		for(u32 j=1;j<i;j+=2)
			w[j]=mul(s,w[j-1]);
		for(u32 j=0;j<n;j+=i<<1){
			vec*b=a+j,*c=b+i;
			for(u32 k=0;k<i;++k){
				vec v=mul(w[k],c[k]);
				c[k]=_mm_sub_pd(b[k],v);
				b[k]=_mm_add_pd(b[k],v);
			}
		}
	}
}
void read(vec*a,u32 n){
	for(u32 i=0;i<n/2;++i){
		u32 x=buf,y=buf;
		a[i]=_mm_setr_pd(x,y);
	}
	if(n&1)
		a[n/2]=_mm_set_sd(buf);
}
signed main(){
	static u32 n=buf+1,m=buf+1,l=1<<__lg(n+m-1);
	if(n<=1000000/m){
		static u32 a[N],c[N];
		for(u32 i=0;i<n;++i)
			a[i]=buf;
		for(u32 i=0;i<m;++i){
			u32 x=buf;
			for(u32 j=0;j<n;++j)
				c[i+j]+=x*a[j];
		}
		for(u32 i=0;i<n+m-1;++i)
			buf.out(c[i]);
		exit(0);
	}
	read(a,n);
	read(b,m);
	fft(a,l);
	fft(b,l);
	for(u32 i=0;i<l;++i){
		u32 j=l-i&l-1;
		c[j]=mul(_mm_setr_pd(0,.25),_mm_sub_pd(mul(conj(mul(a[j],b[j])),_mm_set_sd(4)),mul(mul(_mm_sub_pd(conj(a[j]),a[i]),_mm_sub_pd(conj(b[j]),b[i])),_mm_add_pd(i<l/2?w[i]:mul(w[i-l/2],_mm_set_sd(-1)),_mm_set_sd(1)))));
	}
	fft(c,l);
	for(u32 i=0;i<n+m-1;++i)
		buf.out(get(c[i>>1],~i&1)/l+.5);
}

CompilationN/AN/ACompile OKScore: N/A

Subtask #1 Testcase #112.41 us44 KBAcceptedScore: 0

Subtask #1 Testcase #214.907 ms10 MB + 260 KBAcceptedScore: 100

Subtask #1 Testcase #31.177 ms1 MB + 164 KBAcceptedScore: 0

Subtask #1 Testcase #41.143 ms1 MB + 532 KBAcceptedScore: 0

Subtask #1 Testcase #512.13 us44 KBAcceptedScore: 0

Subtask #1 Testcase #611.43 us44 KBAcceptedScore: 0

Subtask #1 Testcase #711.73 us44 KBAcceptedScore: 0

Subtask #1 Testcase #814.217 ms9 MB + 680 KBAcceptedScore: 0

Subtask #1 Testcase #914.185 ms9 MB + 680 KBAcceptedScore: 0

Subtask #1 Testcase #1013.505 ms9 MB + 76 KBAcceptedScore: 0

Subtask #1 Testcase #1115.124 ms10 MB + 420 KBAcceptedScore: 0

Subtask #1 Testcase #1212.111 ms8 MB + 176 KBAcceptedScore: 0

Subtask #1 Testcase #1311.59 us44 KBAcceptedScore: 0


Judge Duck Online | 评测鸭在线
Server Time: 2024-05-04 02:54:21 | Loaded in 1 ms | Server Status
个人娱乐项目,仅供学习交流使用