fps/fps-ntt-friendly.hpp
Depends on
Verified with
Code
#pragma once
#include "fft/ntt.hpp"
#include "fps/formal-power-series.hpp"
template < class mint >
void FormalPowerSeries < mint >:: set_ntt () {
if ( ! ntt_ptr ) ntt_ptr = new NTT < mint > ;
}
template < class mint >
FormalPowerSeries < mint >& FormalPowerSeries < mint >:: operator *= ( const FormalPowerSeries < mint >& r ) {
if ( this -> empty () || r . empty ()) {
this -> clear ();
return * this ;
}
set_ntt ();
auto ret = static_cast < NTT < mint >*> ( ntt_ptr ) -> multiply ( * this , r );
return * this = FormalPowerSeries < mint > ( ret . begin (), ret . end ());
}
template < class mint >
FormalPowerSeries < mint > FormalPowerSeries < mint >:: middle_product ( const FormalPowerSeries < mint >& r ) const {
set_ntt ();
auto ret = static_cast < NTT < mint >*> ( ntt_ptr ) -> middle_product ( * this , r );
return FormalPowerSeries < mint > ( ret . begin (), ret . end ());
}
template < class mint >
void FormalPowerSeries < mint >:: ntt () {
set_ntt ();
static_cast < NTT < mint >*> ( ntt_ptr ) -> ntt ( * this );
}
template < class mint >
void FormalPowerSeries < mint >:: intt () {
set_ntt ();
static_cast < NTT < mint >*> ( ntt_ptr ) -> intt ( * this );
}
template < class mint >
void FormalPowerSeries < mint >:: ntt_doubling () {
set_ntt ();
static_cast < NTT < mint >*> ( ntt_ptr ) -> ntt_doubling ( * this );
}
template < typename mint >
int FormalPowerSeries < mint >:: ntt_root () {
set_ntt ();
return static_cast < NTT < mint >*> ( ntt_ptr ) -> g ;
}
template < typename mint >
FormalPowerSeries < mint > FormalPowerSeries < mint >:: inv ( int deg ) const {
assert (( * this )[ 0 ] != mint ( 0 ));
if ( deg == - 1 ) deg = ( * this ). size ();
FPS ret { mint ( 1 ) / ( * this )[ 0 ]};
for ( int i = 1 ; i < deg ; i <<= 1 )
ret = ( ret + ret - ret * ret * ( * this ). pre ( i << 1 )). pre ( i << 1 );
return ret . pre ( deg );
}
template < typename mint >
FormalPowerSeries < mint > FormalPowerSeries < mint >:: exp ( int deg ) const {
assert (( * this )[ 0 ] == mint ( 0 ));
if ( deg == - 1 ) deg = ( * this ). size ();
FPS ret { mint ( 1 )};
for ( int i = 1 ; i < deg ; i <<= 1 )
ret = ( ret * (( * this ). pre ( i << 1 ) - ret . log ( i << 1 ) + 1 )). pre ( i << 1 );
return ret . pre ( deg );
}
#line 2 "fps/fps-ntt-friendly.hpp"
#line 2 "fft/ntt.hpp"
template < class mint >
struct NTT {
static constexpr unsigned int mod = mint :: get_mod ();
static constexpr unsigned long long pow_constexpr ( unsigned long long x , unsigned long long n , unsigned long long m ) {
unsigned long long y = 1 ;
while ( n ) {
if ( n & 1 ) y = y * x % m ;
x = x * x % m ;
n >>= 1 ;
}
return y ;
}
static constexpr unsigned int get_g () {
unsigned long long x = 2 ;
while ( pow_constexpr ( x , ( mod - 1 ) >> 1 , mod ) == 1 ) x += 1 ;
return x ;
}
static constexpr unsigned int g = get_g ();
static constexpr int rank2 = __builtin_ctzll ( mod - 1 );
array < mint , rank2 + 1 > root ;
array < mint , rank2 + 1 > iroot ;
array < mint , max ( 0 , rank2 - 2 + 1 ) > rate2 ;
array < mint , max ( 0 , rank2 - 2 + 1 ) > irate2 ;
array < mint , max ( 0 , rank2 - 3 + 1 ) > rate3 ;
array < mint , max ( 0 , rank2 - 3 + 1 ) > irate3 ;
NTT () {
root [ rank2 ] = mint ( g ). pow (( mod - 1 ) >> rank2 );
iroot [ rank2 ] = root [ rank2 ]. inv ();
for ( int i = rank2 - 1 ; i >= 0 ; i -- ) {
root [ i ] = root [ i + 1 ] * root [ i + 1 ];
iroot [ i ] = iroot [ i + 1 ] * iroot [ i + 1 ];
}
{
mint prod = 1 , iprod = 1 ;
for ( int i = 0 ; i <= rank2 - 2 ; i ++ ) {
rate2 [ i ] = root [ i + 2 ] * prod ;
irate2 [ i ] = iroot [ i + 2 ] * iprod ;
prod *= iroot [ i + 2 ];
iprod *= root [ i + 2 ];
}
}
{
mint prod = 1 , iprod = 1 ;
for ( int i = 0 ; i <= rank2 - 3 ; i ++ ) {
rate3 [ i ] = root [ i + 3 ] * prod ;
irate3 [ i ] = iroot [ i + 3 ] * iprod ;
prod *= iroot [ i + 3 ];
iprod *= root [ i + 3 ];
}
}
}
void ntt ( vector < mint >& a ) {
int n = int ( a . size ());
int h = __builtin_ctzll (( unsigned int ) n );
a . resize ( 1 << h );
int len = 0 ; // a[i, i+(n>>len), i+2*(n>>len), ..] is transformed
while ( len < h ) {
if ( h - len == 1 ) {
int p = 1 << ( h - len - 1 );
mint rot = 1 ;
for ( int s = 0 ; s < ( 1 << len ); s ++ ) {
int offset = s << ( h - len );
for ( int i = 0 ; i < p ; i ++ ) {
auto l = a [ i + offset ];
auto r = a [ i + offset + p ] * rot ;
a [ i + offset ] = l + r ;
a [ i + offset + p ] = l - r ;
}
if ( s + 1 != ( 1 << len )) rot *= rate2 [ __builtin_ctzll ( ~ ( unsigned int )( s ))];
}
len ++ ;
} else {
// 4-base
int p = 1 << ( h - len - 2 );
mint rot = 1 , imag = root [ 2 ];
for ( int s = 0 ; s < ( 1 << len ); s ++ ) {
mint rot2 = rot * rot ;
mint rot3 = rot2 * rot ;
int offset = s << ( h - len );
for ( int i = 0 ; i < p ; i ++ ) {
auto mod2 = 1ULL * mint :: get_mod () * mint :: get_mod ();
auto a0 = 1ULL * a [ i + offset ]. val ();
auto a1 = 1ULL * a [ i + offset + p ]. val () * rot . val ();
auto a2 = 1ULL * a [ i + offset + 2 * p ]. val () * rot2 . val ();
auto a3 = 1ULL * a [ i + offset + 3 * p ]. val () * rot3 . val ();
auto a1na3imag = 1ULL * mint ( a1 + mod2 - a3 ). val () * imag . val ();
auto na2 = mod2 - a2 ;
a [ i + offset ] = a0 + a2 + a1 + a3 ;
a [ i + offset + 1 * p ] = a0 + a2 + ( 2 * mod2 - ( a1 + a3 ));
a [ i + offset + 2 * p ] = a0 + na2 + a1na3imag ;
a [ i + offset + 3 * p ] = a0 + na2 + ( mod2 - a1na3imag );
}
if ( s + 1 != ( 1 << len )) rot *= rate3 [ __builtin_ctzll ( ~ ( unsigned int )( s ))];
}
len += 2 ;
}
}
}
void intt ( vector < mint >& a ) {
int n = int ( a . size ());
int h = __builtin_ctzll (( unsigned int ) n );
a . resize ( 1 << h );
int len = h ; // a[i, i+(n>>len), i+2*(n>>len), ..] is transformed
while ( len ) {
if ( len == 1 ) {
int p = 1 << ( h - len );
mint irot = 1 ;
for ( int s = 0 ; s < ( 1 << ( len - 1 )); s ++ ) {
int offset = s << ( h - len + 1 );
for ( int i = 0 ; i < p ; i ++ ) {
auto l = a [ i + offset ];
auto r = a [ i + offset + p ];
a [ i + offset ] = l + r ;
a [ i + offset + p ] = ( unsigned long long )( mint :: get_mod () + l . val () - r . val ()) * irot . val ();
}
if ( s + 1 != ( 1 << ( len - 1 ))) irot *= irate2 [ __builtin_ctzll ( ~ ( unsigned int )( s ))];
}
len -- ;
} else {
// 4-base
int p = 1 << ( h - len );
mint irot = 1 , iimag = iroot [ 2 ];
for ( int s = 0 ; s < ( 1 << ( len - 2 )); s ++ ) {
mint irot2 = irot * irot ;
mint irot3 = irot2 * irot ;
int offset = s << ( h - len + 2 );
for ( int i = 0 ; i < p ; i ++ ) {
auto a0 = 1ULL * a [ i + offset + 0 * p ]. val ();
auto a1 = 1ULL * a [ i + offset + 1 * p ]. val ();
auto a2 = 1ULL * a [ i + offset + 2 * p ]. val ();
auto a3 = 1ULL * a [ i + offset + 3 * p ]. val ();
auto a2na3iimag = 1ULL * mint (( mint :: get_mod () + a2 - a3 ) * iimag . val ()). val ();
a [ i + offset ] = a0 + a1 + a2 + a3 ;
a [ i + offset + 1 * p ] = ( a0 + ( mint :: get_mod () - a1 ) + a2na3iimag ) * irot . val ();
a [ i + offset + 2 * p ] = ( a0 + a1 + ( mint :: get_mod () - a2 ) + ( mint :: get_mod () - a3 )) * irot2 . val ();
a [ i + offset + 3 * p ] = ( a0 + ( mint :: get_mod () - a1 ) + ( mint :: get_mod () - a2na3iimag )) * irot3 . val ();
}
if ( s + 1 != ( 1 << ( len - 2 ))) irot *= irate3 [ __builtin_ctzll ( ~ ( unsigned int )( s ))];
}
len -= 2 ;
}
}
mint e = mint ( n ). inv ();
for ( auto & x : a ) x *= e ;
}
vector < mint > multiply ( const vector < mint >& a , const vector < mint >& b ) {
if ( a . empty () || b . empty ()) return vector < mint > ();
int n = a . size (), m = b . size ();
int sz = n + m - 1 ;
if ( n <= 30 || m <= 30 ) {
if ( n > 30 ) return multiply ( b , a );
vector < mint > res ( sz );
for ( int i = 0 ; i < n ; i ++ )
for ( int j = 0 ; j < m ; j ++ ) res [ i + j ] += a [ i ] * b [ j ];
return res ;
}
int sz1 = 1 ;
while ( sz1 < sz ) sz1 <<= 1 ;
vector < mint > res ( sz1 );
for ( int i = 0 ; i < n ; i ++ ) res [ i ] = a [ i ];
ntt ( res );
if ( a == b )
for ( int i = 0 ; i < sz1 ; i ++ ) res [ i ] *= res [ i ];
else {
vector < mint > c ( sz1 );
for ( int i = 0 ; i < m ; i ++ ) c [ i ] = b [ i ];
ntt ( c );
for ( int i = 0 ; i < sz1 ; i ++ ) res [ i ] *= c [ i ];
}
intt ( res );
res . resize ( sz );
return res ;
}
// c[i]=sum[j]a[j]b[i+j]
vector < mint > middle_product ( const vector < mint >& a , const vector < mint >& b ) {
if ( b . empty () || a . size () > b . size ()) return {};
int n = a . size (), m = b . size ();
int sz = m - n + 1 ;
if ( n <= 30 || sz <= 30 ) {
vector < mint > res ( sz );
for ( int i = 0 ; i < sz ; i ++ )
for ( int j = 0 ; j < n ; j ++ ) res [ i ] += a [ j ] * b [ i + j ];
return res ;
}
int sz1 = 1 ;
while ( sz1 < m ) sz1 <<= 1 ;
vector < mint > res ( sz1 ), b2 ( sz1 );
reverse_copy ( a . begin (), a . end (), res . begin ());
copy ( b . begin (), b . end (), b2 . begin ());
ntt ( res );
ntt ( b2 );
for ( int i = 0 ; i < res . size (); i ++ ) res [ i ] *= b2 [ i ];
intt ( res );
res . resize ( m );
res . erase ( res . begin (), res . begin () + n - 1 );
return res ;
}
void ntt_doubling ( vector < mint >& a ) {
int n = ( int ) a . size ();
auto b = a ;
intt ( b );
mint r = 1 , zeta = mint ( g ). pow (( mint :: get_mod () - 1 ) / ( n << 1 ));
for ( int i = 0 ; i < n ; i ++ ) b [ i ] *= r , r *= zeta ;
ntt ( b );
copy ( b . begin (), b . end (), back_inserter ( a ));
}
};
/**
* @brief NTT (数論変換)
* @docs docs/fft/ntt.md
*/
#line 2 "fps/formal-power-series.hpp"
template < class mint >
struct FormalPowerSeries : vector < mint > {
using vector < mint >:: vector ;
using FPS = FormalPowerSeries ;
FPS & operator += ( const FPS & r ) {
if ( r . size () > this -> size ()) this -> resize ( r . size ());
for ( int i = 0 ; i < ( int ) r . size (); i ++ ) ( * this )[ i ] += r [ i ];
return * this ;
}
FPS & operator += ( const mint & r ) {
if ( this -> empty ()) this -> resize ( 1 );
( * this )[ 0 ] += r ;
return * this ;
}
FPS & operator -= ( const FPS & r ) {
if ( r . size () > this -> size ()) this -> resize ( r . size ());
for ( int i = 0 ; i < ( int ) r . size (); i ++ ) ( * this )[ i ] -= r [ i ];
return * this ;
}
FPS & operator -= ( const mint & r ) {
if ( this -> empty ()) this -> resize ( 1 );
( * this )[ 0 ] -= r ;
return * this ;
}
FPS & operator *= ( const mint & v ) {
for ( int k = 0 ; k < ( int ) this -> size (); k ++ ) ( * this )[ k ] *= v ;
return * this ;
}
FPS & operator /= ( const FPS & r ) {
if ( this -> size () < r . size ()) {
this -> clear ();
return * this ;
}
int n = this -> size () - r . size () + 1 ;
if (( int ) r . size () <= 64 ) {
FPS f ( * this ), g ( r );
g . shrink ();
mint coeff = g . at ( g . size () - 1 ). inv ();
for ( auto & x : g ) x *= coeff ;
int deg = ( int ) f . size () - ( int ) g . size () + 1 ;
int gs = g . size ();
FPS quo ( deg );
for ( int i = deg - 1 ; i >= 0 ; i -- ) {
quo [ i ] = f [ i + gs - 1 ];
for ( int j = 0 ; j < gs ; j ++ ) f [ i + j ] -= quo [ i ] * g [ j ];
}
* this = quo * coeff ;
this -> resize ( n , mint ( 0 ));
return * this ;
}
return * this = (( * this ). rev (). pre ( n ) * r . rev (). inv ( n )). pre ( n ). rev ();
}
FPS & operator %= ( const FPS & r ) {
* this -= * this / r * r ;
shrink ();
return * this ;
}
FPS operator + ( const FPS & r ) const { return FPS ( * this ) += r ; }
FPS operator + ( const mint & v ) const { return FPS ( * this ) += v ; }
FPS operator - ( const FPS & r ) const { return FPS ( * this ) -= r ; }
FPS operator - ( const mint & v ) const { return FPS ( * this ) -= v ; }
FPS operator * ( const FPS & r ) const { return FPS ( * this ) *= r ; }
FPS operator * ( const mint & v ) const { return FPS ( * this ) *= v ; }
FPS operator / ( const FPS & r ) const { return FPS ( * this ) /= r ; }
FPS operator % ( const FPS & r ) const { return FPS ( * this ) %= r ; }
FPS operator - () const {
FPS ret ( this -> size ());
for ( int i = 0 ; i < ( int ) this -> size (); i ++ ) ret [ i ] = - ( * this )[ i ];
return ret ;
}
void shrink () {
while ( this -> size () && this -> back () == mint ( 0 )) this -> pop_back ();
}
FPS rev () const {
FPS ret ( * this );
reverse ( begin ( ret ), end ( ret ));
return ret ;
}
FPS dot ( FPS r ) const {
FPS ret ( min ( this -> size (), r . size ()));
for ( int i = 0 ; i < ( int ) ret . size (); i ++ ) ret [ i ] = ( * this )[ i ] * r [ i ];
return ret ;
}
FPS pre ( int sz ) const {
return FPS ( begin ( * this ), begin ( * this ) + min (( int ) this -> size (), sz ));
}
FPS operator >>= ( int sz ) {
assert ( sz >= 0 );
if (( int ) this -> size () <= sz ) return {};
this -> erase ( this -> begin (), this -> begin () + sz );
return * this ;
}
FPS operator >> ( int sz ) const {
if (( int ) this -> size () <= sz ) return {};
FPS ret ( * this );
ret . erase ( ret . begin (), ret . begin () + sz );
return ret ;
}
FPS operator <<= ( int sz ) {
assert ( sz >= 0 );
this -> insert ( this -> begin (), sz , mint ( 0 ));
return * this ;
}
FPS operator << ( int sz ) const {
FPS ret ( * this );
ret . insert ( ret . begin (), sz , mint ( 0 ));
return ret ;
}
FPS diff () const {
const int n = ( int ) this -> size ();
FPS ret ( max ( 0 , n - 1 ));
mint one ( 1 ), coeff ( 1 );
for ( int i = 1 ; i < n ; i ++ ) {
ret [ i - 1 ] = ( * this )[ i ] * coeff ;
coeff += one ;
}
return ret ;
}
FPS integral () const {
const int n = ( int ) this -> size ();
FPS ret ( n + 1 );
ret [ 0 ] = mint ( 0 );
if ( n > 0 ) ret [ 1 ] = mint ( 1 );
auto mod = mint :: get_mod ();
for ( int i = 2 ; i <= n ; i ++ ) ret [ i ] = ( - ret [ mod % i ]) * ( mod / i );
for ( int i = 0 ; i < n ; i ++ ) ret [ i + 1 ] *= ( * this )[ i ];
return ret ;
}
mint eval ( mint x ) const {
mint r = 0 , w = 1 ;
for ( auto & v : * this ) r += w * v , w *= x ;
return r ;
}
FPS log ( int deg = - 1 ) const {
assert (( * this )[ 0 ] == mint ( 1 ));
if ( deg == - 1 ) deg = ( int ) this -> size ();
return ( this -> diff () * this -> inv ( deg )). pre ( deg - 1 ). integral ();
}
FPS pow ( int64_t k , int deg = - 1 ) const {
const int n = ( int ) this -> size ();
if ( deg == - 1 ) deg = n ;
if ( k == 0 ) {
FPS ret ( deg );
if ( deg ) ret [ 0 ] = 1 ;
return ret ;
}
for ( int i = 0 ; i < n ; i ++ ) {
if (( * this )[ i ] != mint ( 0 )) {
mint rev = mint ( 1 ) / ( * this )[ i ];
FPS ret = ((( * this * rev ) >> i ). log ( deg ) * k ). exp ( deg );
ret *= ( * this )[ i ]. pow ( k );
ret = ( ret << ( i * k )). pre ( deg );
if (( int ) ret . size () < deg ) ret . resize ( deg , mint ( 0 ));
return ret ;
}
if ( __int128_t ( i + 1 ) * k >= deg ) return FPS ( deg , mint ( 0 ));
}
return FPS ( deg , mint ( 0 ));
}
static void * ntt_ptr ;
static void set_ntt ();
FPS & operator *= ( const FPS & r );
FPS middle_product ( const FPS & r ) const ;
void ntt ();
void intt ();
void ntt_doubling ();
static int ntt_root ();
FPS inv ( int deg = - 1 ) const ;
FPS exp ( int deg = - 1 ) const ;
};
template < typename mint >
void * FormalPowerSeries < mint >:: ntt_ptr = nullptr ;
#line 5 "fps/fps-ntt-friendly.hpp"
template < class mint >
void FormalPowerSeries < mint >:: set_ntt () {
if ( ! ntt_ptr ) ntt_ptr = new NTT < mint > ;
}
template < class mint >
FormalPowerSeries < mint >& FormalPowerSeries < mint >:: operator *= ( const FormalPowerSeries < mint >& r ) {
if ( this -> empty () || r . empty ()) {
this -> clear ();
return * this ;
}
set_ntt ();
auto ret = static_cast < NTT < mint >*> ( ntt_ptr ) -> multiply ( * this , r );
return * this = FormalPowerSeries < mint > ( ret . begin (), ret . end ());
}
template < class mint >
FormalPowerSeries < mint > FormalPowerSeries < mint >:: middle_product ( const FormalPowerSeries < mint >& r ) const {
set_ntt ();
auto ret = static_cast < NTT < mint >*> ( ntt_ptr ) -> middle_product ( * this , r );
return FormalPowerSeries < mint > ( ret . begin (), ret . end ());
}
template < class mint >
void FormalPowerSeries < mint >:: ntt () {
set_ntt ();
static_cast < NTT < mint >*> ( ntt_ptr ) -> ntt ( * this );
}
template < class mint >
void FormalPowerSeries < mint >:: intt () {
set_ntt ();
static_cast < NTT < mint >*> ( ntt_ptr ) -> intt ( * this );
}
template < class mint >
void FormalPowerSeries < mint >:: ntt_doubling () {
set_ntt ();
static_cast < NTT < mint >*> ( ntt_ptr ) -> ntt_doubling ( * this );
}
template < typename mint >
int FormalPowerSeries < mint >:: ntt_root () {
set_ntt ();
return static_cast < NTT < mint >*> ( ntt_ptr ) -> g ;
}
template < typename mint >
FormalPowerSeries < mint > FormalPowerSeries < mint >:: inv ( int deg ) const {
assert (( * this )[ 0 ] != mint ( 0 ));
if ( deg == - 1 ) deg = ( * this ). size ();
FPS ret { mint ( 1 ) / ( * this )[ 0 ]};
for ( int i = 1 ; i < deg ; i <<= 1 )
ret = ( ret + ret - ret * ret * ( * this ). pre ( i << 1 )). pre ( i << 1 );
return ret . pre ( deg );
}
template < typename mint >
FormalPowerSeries < mint > FormalPowerSeries < mint >:: exp ( int deg ) const {
assert (( * this )[ 0 ] == mint ( 0 ));
if ( deg == - 1 ) deg = ( * this ). size ();
FPS ret { mint ( 1 )};
for ( int i = 1 ; i < deg ; i <<= 1 )
ret = ( ret * (( * this ). pre ( i << 1 ) - ret . log ( i << 1 ) + 1 )). pre ( i << 1 );
return ret . pre ( deg );
}
Back to top page