/*
Author: Ishmeet Dosanjh
Date of Created: 1/12/17
Version: 0.1
*/
#pragma comment(linker, "/stack:20000000")
#pragma GCC optimize("Ofast")
#pragma GCC target("sse,sse2,sse3,ssse3,sse4,popcnt,abm,mmx,avx,tune=native")
#define _CRT_SECURE_NO_WARNINGS
#include <climits>
# include <iostream>
# include <cmath>
# include <algorithm>
# include <stdio.h>
# include <cstdint>
# include <cstring>
# include <string>
# include <cstdlib>
# include <vector>
# include <bitset>
# include <map>
# include <queue>
# include <ctime>
# include <stack>
# include <set>
# include <list>
# include <random>
# include <deque>
# include <functional>
# include <iomanip>
# include <sstream>
# include <fstream>
# include <complex>
# include <numeric>
# include <immintrin.h>
# include <cassert>
# include <array>
# include <tuple>
// #include <unordered_set> i ngcc 6.6
using namespace std;
// Let's define unordered map
# ifdef __GNUC__
# if __cplusplus > 199711L
# include <unordered_set>
# include <unordered_map>
# else
# include <tr1/unordered_map>
# include <tr1/unordered_set>
using namespace tr1;
# endif
# else
# include <unordered_map>
# include <unordered_set>
# endif
#define VA_NUM_ARGS(...) VA_NUM_ARGS_IMPL_((0,__VA_ARGS__, 6,5,4,3,2,1))
#define VA_NUM_ARGS_IMPL_(tuple) VA_NUM_ARGS_IMPL tuple
#define VA_NUM_ARGS_IMPL(_0,_1,_2,_3,_4,_5,_6,N,...) N
#define macro_dispatcher(macro, ...) macro_dispatcher_(macro, VA_NUM_ARGS(__VA_ARGS__))
#define macro_dispatcher_(macro, nargs) macro_dispatcher__(macro, nargs)
#define macro_dispatcher__(macro, nargs) macro_dispatcher___(macro, nargs)
#define macro_dispatcher___(macro, nargs) macro ## nargs
#define DBN1(a) cerr<<#a<<"="<<(a)<<"\n"
#define DBN2(a,b) cerr<<#a<<"="<<(a)<<", "<<#b<<"="<<(b)<<"\n"
#define DBN3(a,b,c) cerr<<#a<<"="<<(a)<<", "<<#b<<"="<<(b)<<", "<<#c<<"="<<(c)<<"\n"
#define DBN4(a,b,c,d) cerr<<#a<<"="<<(a)<<", "<<#b<<"="<<(b)<<", "<<#c<<"="<<(c)<<", "<<#d<<"="<<(d)<<"\n"
#define DBN5(a,b,c,d,e) cerr<<#a<<"="<<(a)<<", "<<#b<<"="<<(b)<<", "<<#c<<"="<<(c)<<", "<<#d<<"="<<(d)<<", "<<#e<<"="<<(e)<<"\n"
#define DBN6(a,b,c,d,e,f) cerr<<#a<<"="<<(a)<<", "<<#b<<"="<<(b)<<", "<<#c<<"="<<(c)<<", "<<#d<<"="<<(d)<<", "<<#e<<"="<<(e)<<", "<<#f<<"="<<(f)<<"\n"
#define DBN(...) macro_dispatcher(DBN, __VA_ARGS__)(__VA_ARGS__)
#define DA(a,n) cerr<<#a<<"=["; printarray(a,n); cerr<<"]\n"
#define DAR(a,n,s) cerr<<#a<<"["<<s<<"-"<<n-1<<"]=["; printarray(a,n,s); cerr<<"]\n"
#ifdef _MSC_VER
#define PREFETCH(ptr, rw, level) ((void)0)
#else
#define PREFETCH(ptr, rw, level) __builtin_prefetch(ptr, rw, level)
#endif
#ifdef LOCAL
#define CURTIME() cerr << clock() * 1.0 / CLOCKS_PER_SEC << endl
#else
#define CURTIME()
#endif
#define pb push_back
#define mp make_pair
typedef long long ll;
typedef unsigned int uint;
typedef unsigned long long ull;
typedef double d;
typedef float f;
typedef pair< int , int > pii;
typedef pair< long long , long long > pll;
typedef vector< int > vi;
typedef vector< long long > vll;
typedef int itn;
typedef long l;
/***************************************************************/
// TEMPLATE DECLARATIONS
template < class T1, class T2, class T3>
struct triple{ T1 a; T2 b; T3 c; triple( ) : a( T1( ) ) , b( T2( ) ) , c( T3( ) ) { } ; triple( T1 _a, T2 _b, T3 _c) : a( _a) , b( _b) , c( _c) { } } ;
template < class T1, class T2, class T3>
bool operator< ( const triple< T1,T2,T3> & t1,const triple< T1,T2,T3> & t2) { if ( t1.a ! = t2.a ) return t1.a < t2.a ; else if ( t1.b ! = t2.b ) return t1.b < t2.b ; else return t1.c < t2.c ; }
template < class T1, class T2, class T3>
bool operator> ( const triple< T1,T2,T3> & t1,const triple< T1,T2,T3> & t2) { if ( t1.a ! = t2.a ) return t1.a > t2.a ; else if ( t1.b ! = t2.b ) return t1.b > t2.b ; else return t1.c > t2.c ; }
#define tri triple<int,int,int>
#define trll triple<ll,ll,ll>
//for 1 based arrays
#define FI2(n) for(int i=1;i<=(n);++i)
#define FJ2(n) for(int j=1;j<=(n);++j)
#define FK2(n) for(int k=1;k<=(n);++k)
//for 0 based indexed arrays
#define FI(n) for(long i=0;i<(n);i++)
#define FJ(n) for(long long j=0;j<(n);j++)
#define FK(n) for(int k=0;k<(n);++k)
#define FL(n) for(int l=0;l<(n);++l)
#define FQ(n) for(int q=0;q<(n);++q)
#define FOR(i,a,b) for(int i = (a), __e = (int) (b); i < __e; ++i)
#define all(a) std::begin(a), std::end(a)
#define reunique(v) v.resize(std::unique(v.begin(), v.end()) - v.begin())
#define sqr(x) ((x) * (x))
#define sqrt(x) sqrt(1.0 * (x))
#define pow(x, n) pow(1.0 * (x), n)
#define COMPARE(obj) [&](const std::decay_t<decltype(obj)>& a, const std::decay_t<decltype(obj)>& b)
#define COMPARE_BY(obj, field) [&](const std::decay_t<decltype(obj)>& a, const std::decay_t<decltype(obj)>& b) { return a.field < b.field; }
#define checkbit(n, b) (((n) >> (b)) & 1)
#define setbit(n, b) ((n) | (static_cast<std::decay_t<decltype(n)>>(1) << (b)))
#define removebit(n, b) ((n) & ~(static_cast<std::decay_t<decltype(n)>>(1) << (b)))
#define flipbit(n, b) ((n) ^ (static_cast<std::decay_t<decltype(n)>>(1) << (b)))
inline int countBits( uint v) { v= v- ( ( v>> 1 ) & 0x55555555 ) ; v= ( v& 0x33333333 ) + ( ( v>> 2 ) & 0x33333333 ) ; return ( ( v+ ( v>> 4 ) & 0xF0F0F0F ) * 0x1010101 ) >> 24 ; }
inline int countBits( ull v) { uint t= v>> 32 ; uint p= ( v & ( ( 1ULL << 32 ) - 1 ) ) ; return countBits( t) + countBits( p) ; }
inline int countBits( ll v) { return countBits( ( ull) v) ; }
inline int countBits( int v) { return countBits( ( uint) v) ; }
unsigned int reverseBits( uint x) { x = ( ( ( x & 0xaaaaaaaa ) >> 1 ) | ( ( x & 0x55555555 ) << 1 ) ) ; x = ( ( ( x & 0xcccccccc ) >> 2 ) | ( ( x & 0x33333333 ) << 2 ) ) ; x = ( ( ( x & 0xf0f0f0f0 ) >> 4 ) | ( ( x & 0x0f0f0f0f ) << 4 ) ) ; x = ( ( ( x & 0xff00ff00 ) >> 8 ) | ( ( x & 0x00ff00ff ) << 8 ) ) ; return ( ( x >> 16 ) | ( x << 16 ) ) ; }
template < class T> inline int sign( T x) { return x > 0 ? 1 : x < 0 ? - 1 : 0 ; }
inline bool isPowerOfTwo( int x) { return ( x ! = 0 && ( x& ( x - 1 ) ) == 0 ) ; }
constexpr ll power( ll x, int p) { return p == 0 ? 1 : ( x * power( x, p - 1 ) ) ; }
template < class T1, class T2, class T3> T1 inline clamp( T1 x, const T2& a, const T3& b) { if ( x < a) return a; else if ( x > b) return b; else return x; }
unsigned long long rdtsc( ) { unsigned long long ret = 0 ;
#ifdef __clang__
return __builtin_readcyclecounter( ) ;
#endif
#ifndef _MSC_VER
asm volatile ( "rdtsc" : "=A" ( ret) : : ) ;
#endif
return ret; }
// Fast IO ********************************************************************************************************
const int __BS = 4096 ;
static char __bur[ __BS + 16 ] , * __er = __bur + __BS, * __ir = __er;
template < class T = int > T readInt( ) {
auto c = [ & ] ( ) { if ( __ir == __er) std:: fill ( __bur, __bur + __BS, 0 ) , cin .read ( __bur, __BS) , __ir = __bur; } ;
c( ) ; while ( * __ir && ( * __ir < '0' || * __ir > '9' ) && * __ir ! = '-' ) ++ __ir; c( ) ;
bool m = false ; if ( * __ir == '-' ) ++ __ir, c( ) , m = true ;
T r = 0 ; while ( * __ir >= '0' && * __ir <= '9' ) r = r * 10 + * __ir - '0' , ++ __ir, c( ) ;
++ __ir; return m ? - r : r;
}
static char __buw[ __BS + 20 ] , * __iw = __buw, * __ew = __buw + __BS;
template < class T>
void writeInt( T x, char endc = '\n ' ) {
if ( x < 0 ) * __iw++ = '-' , x = - x; if ( x == 0 ) * __iw++ = '0' ;
char * s = __iw;
while ( x) { T t = x / 10 ; char c = x - 10 * t + '0' ; * __iw++ = c; x = t; }
char * f = __iw - 1 ; while ( s < f) swap( * s, * f) , ++ s, -- f;
if ( __iw > __ew) cout .write ( __buw, __iw - __buw) , __iw = __buw;
* __iw++ = endc;
}
template < class T>
void writeStr( const T& str) {
int i = 0 ; while ( str[ i] ) { * __iw++ = str[ i++ ] ; if ( __iw > __ew) cout .write ( __buw, __iw - __buw) , __iw = __buw; }
}
struct __FL__ { ~__FL__( ) { if ( __iw ! = __buw) cout .write ( __buw, __iw - __buw) ; } } ;
static __FL__ __flushVar__;
//STL output *****************************************************************************************************
#define TT1 template<class T>
#define TT1T2 template<class T1, class T2>
#define TT1T2T3 template<class T1, class T2, class T3>
TT1T2 ostream& operator << ( ostream& os, const pair< T1, T2> & p) ;
TT1 ostream& operator << ( ostream& os, const vector< T> & v) ;
TT1T2 ostream& operator << ( ostream& os, const set< T1, T2> & v) ;
TT1T2 ostream& operator << ( ostream& os, const multiset< T1, T2> & v) ;
TT1T2 ostream& operator << ( ostream& os, priority_queue< T1, T2> v) ;
TT1T2T3 ostream& operator << ( ostream& os, const map< T1, T2, T3> & v) ;
TT1T2T3 ostream& operator << ( ostream& os, const multimap< T1, T2, T3> & v) ;
TT1T2T3 ostream& operator << ( ostream& os, const triple< T1, T2, T3> & t) ;
template < class T, size_t N> ostream& operator << ( ostream& os, const array< T, N> & v) ;
TT1T2 ostream& operator << ( ostream& os, const pair< T1, T2> & p) { return os << "(" << p.first << ", " << p.second << ")" ; }
TT1 ostream& operator << ( ostream& os, const vector< T> & v) { bool f= 1 ; os<< "[" ; for ( auto & i : v) { if ( ! f) os << ", " ; os<< i; f= 0 ; } return os << "]" ; }
template < class T, size_t N> ostream& operator << ( ostream& os, const array< T, N> & v) { bool f= 1 ; os<< "[" ; for ( auto & i : v) { if ( ! f) os << ", " ; os<< i; f= 0 ; } return os << "]" ; }
TT1T2 ostream& operator << ( ostream& os, const set< T1, T2> & v) { bool f= 1 ; os<< "[" ; for ( auto & i : v) { if ( ! f) os << ", " ; os<< i; f= 0 ; } return os << "]" ; }
TT1T2 ostream& operator << ( ostream& os, const multiset< T1,T2> & v) { bool f= 1 ; os<< "[" ; for ( auto & i : v) { if ( ! f) os << ", " ; os<< i; f= 0 ; } return os << "]" ; }
TT1T2T3 ostream& operator << ( ostream& os, const map< T1,T2,T3> & v) { bool f = 1 ; os << "[" ; for ( auto & ii : v) { if ( ! f) os << ", " ; os << "(" << ii.first << " -> " << ii.second << ") " ; f = 0 ; } return os << "]" ; }
TT1T2 ostream& operator << ( ostream& os, const multimap< T1, T2> & v) { bool f = 1 ; os << "[" ; for ( auto & ii : v) { if ( ! f) os << ", " ; os << "(" << ii.first << " -> " << ii.second << ") " ; f = 0 ; } return os << "]" ; }
TT1T2 ostream& operator << ( ostream& os, priority_queue< T1, T2> v) { bool f = 1 ; os << "[" ; while ( ! v.empty ( ) ) { auto x = v.top ( ) ; v.pop ( ) ; if ( ! f) os << ", " ; f = 0 ; os << x; } return os << "]" ; }
TT1T2T3 ostream& operator << ( ostream& os, const triple< T1, T2, T3> & t) { return os << "(" << t.a << ", " << t.b << ", " << t.c << ")" ; }
TT1T2 void printarray( const T1& a, T2 sz, T2 beg = 0 ) { for ( T2 i = beg; i< sz; i++ ) cout << a[ i] << " " ; cout << endl; }
//STL input *****************************************************************************************************
TT1T2T3 inline istream& operator >> ( istream& os, triple< T1, T2, T3> & t) ;
TT1T2 inline istream& operator >> ( istream& os, pair< T1, T2> & p) { return os >> p.first >> p.second ; }
TT1 inline istream& operator >> ( istream& os, vector< T> & v) {
if ( v.size ( ) ) for ( T& t : v) os >> t; else {
string s; T obj; while ( s.empty ( ) ) { getline( os, s) ; if ( ! os) return os; }
stringstream ss( s) ; while ( ss >> obj) v.push_back ( obj) ;
}
return os;
}
TT1T2T3 inline istream& operator >> ( istream& os, triple< T1, T2, T3> & t) { return os >> t.a >> t.b >> t.c ; }
//Pair magic *****************************************************************************************************
#define PT1T2 pair<T1, T2>
TT1T2 inline PT1T2 operator+ ( const PT1T2 & p1 , const PT1T2 & p2) { return PT1T2( p1.first + p2.first , p1.second + p2.second ) ; }
TT1T2 inline PT1T2& operator+ = ( PT1T2 & p1 , const PT1T2 & p2) { p1.first + = p2.first , p1.second + = p2.second ; return p1; }
TT1T2 inline PT1T2 operator- ( const PT1T2 & p1 , const PT1T2 & p2) { return PT1T2( p1.first - p2.first , p1.second - p2.second ) ; }
TT1T2 inline PT1T2& operator- = ( PT1T2 & p1 , const PT1T2 & p2) { p1.first - = p2.first , p1.second - = p2.second ; return p1; }
#undef TT1
#undef TT1T2
#undef TT1T2T3
#define FREIN(FILE) freopen(FILE, "rt", stdin)
#define FREOUT(FILE) freopen(FILE, "wt", stdout)
#ifdef LOCAL
#define BEGIN_PROFILE(idx, name) int profileIdx = idx; profileName[profileIdx] = name; totalTime[profileIdx] -= rdtsc() / 1e3;
#define END_PROFILE totalTime[profileIdx] += rdtsc() / 1e3; totalCount[profileIdx]++;
#else
#define BEGIN_PROFILE(idx, name)
#define END_PROFILE
#endif
template < class T> inline void normmod( T & x, T m) { x % = m; if ( x < 0 ) x + = m; }
template < class T1, class T2> inline T2 summodfast( T1 x, T1 y, T2 m) { T2 res = x + y; if ( res >= m) res - = m; return res; }
template < class T1, class T2, class T3> inline void addmodfast( T1 & x, T2 y, T3 m) { x + = y; if ( x >= m) x - = m; }
template < class T1, class T2, class T3> inline void submodfast( T1 & x, T2 y, T3 m) { x - = y; if ( x < 0 ) x + = m; }
#if INTPTR_MAX == INT32_MAX or !defined(__SIZEOF_INT128__)
inline ll mulmod( ll x, ll n, ll m) { ll r = 0 ; normmod( x, m) ; normmod( n, m) ; while ( n) { if ( n & 1 ) r + = x; x + = x; if ( r >= m) r - = m; if ( x >= m) x - = m; n / = 2 ; } return r; }
#else
using int128 = __int128;
inline ll mulmod( ll x, ll n, ll m) { return __int128( x) * n % m; }
#endif
inline ll powmod( ll x, ll n, ll m) { ll r = 1 ; normmod( x, m) ; while ( n) { if ( n & 1 ) r = ( r* x) % m; x = ( x* x) % m; n / = 2 ; } return r; }
inline ll powmulmod( ll x, ll n, ll m) { ll res = 1 ; normmod( x, m) ; while ( n) { if ( n & 1 ) res = mulmod( res, x, m) ; x = mulmod( x, x, m) ; n / = 2 ; } return res; }
template < class T> inline T gcd( T a, T b) { while ( b) { a % = b; T t = a; a = b; b = t; } return a; }
inline ll lcm( ll a, ll b) { return a / gcd( a, b) * b; }
template < class T> inline T gcd( T a, T b, T c) { return gcd( gcd( a, b) , c) ; }
ll gcdex( ll a, ll b, ll& x, ll& y) {
if ( ! a) { x = 0 ; y = 1 ; return b; }
ll y1; ll d = gcdex( b % a, a, y, y1) ; x = y1 - ( b / a) * y;
return d;
}
template < class T> bool isPrime( T x) { if ( x <= 4 || x % 2 == 0 || x % 3 == 0 ) return x == 2 || x == 3 ;
for ( T i = 5 ; i * i <= x; i + = 6 ) if ( x % i == 0 || x % ( i + 2 ) == 0 ) return 0 ; return 1 ; }
bool millerRabin( long long n) {
if ( n <= 1000 ) return isPrime( n) ;
long long s = n - 1 ; int t = 0 ; while ( s % 2 == 0 ) s / = 2 , ++ t;
for ( int a : { 2 , 325 , 9375 , 28178 , 450775 , 9780504 , 1795265022 } ) { if ( ! ( a % = n) ) return true ;
long long f = powmulmod( a, s, n) ; if ( f == 1 || f == n - 1 ) continue ;
for ( int i = 1 ; i < t; ++ i) if ( ( f = mulmod( f, f, n) ) == n - 1 ) goto nextp;
return false ; nextp:;
} return true ;
}
//some modulus and gcd type functions
const int mod = 1e9 + 7 ;
ll powmod( ll a,ll b) { ll res= 1 ; if ( a>= mod) a% = mod; for ( ; b; b>>= 1 ) { if ( b& 1 ) res= res* a; if ( res>= mod) res% = mod; a= a* a; if ( a>= mod) a% = mod; } return res; }
ll gcd( ll a , ll b) { return a== 0 ? b: gcd( b% a,a) ; }
// Useful constants
int some_primes[ 7 ] = { 24443 , 100271 , 1000003 , 1000333 , 5000321 , 98765431 , 1000000123 } ;
#define T9 1000000000
#define T18 1000000000000000000LL
#define INF 1011111111
#define LLINF 1000111000111000111LL
#define EPS (double)1e-10
#define PI 3.14159265358979323846264
#define link asaxlajrewqwe
#define rank wahayawehasdakw
// modulo
#define mod %
#define NUM 1000000007
#define NUM1 1000000009
//scanf type macros
#define s(n) scanf("%d", &n)
#define sl(n) scanf("%ld", &n)
#define sl3(n1,n2,n3) scanf("%lld %lld %lld ", &n1, &n2, &n3)
#define sl4(n1,n2,n3,n4) scanf("%ld %ld %ld %ld", &n1, &n2, &n3, &n4)
#define sll(n) scanf("%I64d", &n)
#define sll2(n) scanf("%lld", &n)
//printf type macros
#define p(n) printf("%d\n", n)
#define pl(n) printf("%ld\n",n)
#define pl3(n1,n2,n3) printf("%lld %lld %lld\n ", n1, n2, n3)
#define pl4(n1,n2,n3,n4) printf("%ld %ld %ld %ld\n ", n1, n2, n3, n4)
#define pll(n) printf("%I64d\n",n)
#define pll2(n) printf("%lld\n",n)
//*************************************************************************************
int32_t solve( ) ;
// C function for extended Euclidean Algorithm
ll gcdExtended( ll a, ll b, ll * x, ll * y) ;
// Function to find modulo inverse of a
ll modInverse( ll a, ll m)
{
ll x, y;
ll g = gcdExtended( a, m, & x, & y) ;
if ( g ! = 1 ) { }
// cout << "Inverse doesn't exist";
else
{
// m is added to handle negative x
ll res = ( x% m + m) % m;
// cout << "Modular multiplicative inverse is " <<
return res;
}
}
// C function for extended Euclidean Algorithm
ll gcdExtended( ll a, ll b, ll * x, ll * y)
{
// Base Case
if ( a == 0 )
{
* x = 0 , * y = 1 ;
return b;
}
ll x1, y1; // To store results of recursive call
ll gcd = gcdExtended( b% a, a, & x1, & y1) ;
// Update x and y using results of recursive
// call
* x = y1 - ( b/ a) * x1;
* y = x1;
return gcd;
}
int32_t main( int argc, char ** argv) {
ios_base:: sync_with_stdio ( 0 ) ; cin .tie ( 0 ) ;
#ifdef LOCAL
FREIN( "input.txt" ) ;
// FREOUT("out.txt");
#endif
return solve( ) ;
}
//red blue ok but i hate palindromes
int32_t solve( ) {
int t; l jspecial,n,j,q,qi,Li,Ri,prevli,prevri,i; //qi is the query iterator here
ll p,x;
s( t) ;
while ( t-- ) {
x= 0 ;
sl( n) ,sll2( p) ,sl( q) ;
ll ppA[ n] ; //prefix product array
ll A[ n] ,prod= 1 ;
FI( n) { sll2( A[ i] ) ; prod= ( prod* A[ i] ) % p,ppA[ i] = prod; }
//for 2 d matrix storing
// for (i = 0; i < n; i++) {
// /* code */
// prod=A[i]%p;
// ppA[i][i]=(prod%p);
// for (j = i+1; j < n; j++) {
// /* code */
// prod=(prod%p*A[j]%p)%p;
// ppA[i][j]=(prod)%p;
// }
// prod=1;
// }
// for (i = 0; i < n; i++) {
// /* code */
for ( j = 0 ; j < n; j++ ) {
/* code */
cout << ppA[ j] << " " ;
}
cout << "\n " ;
// }
l B[ ( ll) floor ( ( double ) q/ ( double ) 64 ) + 2 ] ;
FJ( sizeof ( B) / sizeof ( B[ 0 ] ) ) sl( B[ j] ) ;
// ll sqrtdecompose[(l)ceil(sqrt(n))];
// builddecompostion(A,p,n,sqrtdecompose);
// precomputing(A,n,p);
// l colsize=(l)floor(log(n));
// ll lookup[n][colsize];
//sparse table approach preprocessing O(nlogn) query O(1)
// for (i = 0; i < n; i++) lookup[i][0]=A[i];
// for (j = 1; (1<<j)<= n; j++)//till logn
// /* code */
// for (i = 0; i <= n-(1<<j); i++) {
// /* code */
// //range 2 ki power hai ya nhi it is an part of an query
// lookup[i][j]=((lookup[i][j-1]%p)*((lookup[i+(1<<(j-1))][j-1])%p))%p;
// }
// } //lookup matrix for all possible subarrays of length pow(2,j) for all possible values of j as 0,1,2,3,4,5 up till log(n)
//taran rakha
for ( qi= 0 ; qi< ( q) ; qi++ ) {
if ( qi% 64 == 0 ) //here always first it will executes
{
if ( qi== 0 ) x= 0 ;
Li = ( B[ qi/ 64 ] + x) % n, Ri = ( B[ ( qi/ 64 ) + 1 ] + x) % n;
}
else { Li = ( prevli + x) % n, Ri = ( prevri + x) % n; }
if ( Li> Ri) swap( Li,Ri) ; //O(1) time operation
// x=(lookup[Li][Ri]+1)%p;
//(ans(Li,Ri,A,p,n,sqrtdecompose)
// jspecial=(l)log2(Ri-Li+1);
// if(jspecial%2==0) {x=(lookup[Li][jspecial]+1)%p;}
// else {
// x=(((lookup[Li][jspecial]+lookup[R-(1<<(jspecial))+1][jspecial])/2)+1)%p;
// }
// if(ppA[Li]!=0)
// x=((((ppA[Ri])/ppA[Li-1]))+1)%p;
// std::cout << ppA[Li][Ri-Li] << std::endl;
// <--- @taran check from here --->
x= ( ( ( ppA[ Ri] ) * ( modInverse( ppA[ Li- 1 ] ,p) ) ) % p+ 1 ) % p;
// else
prevli= Li,prevri= Ri;
}
pll2( x% p) ;
}
return 0 ;
}
//sq root decompostion tehcnique used
// #define MAX 1000000
// ll lookup[MAX][MAX];
// void builddecompostion(ll A[],ll p,l n,ll sqrtdecompose[]){
// l blocksize=(l)ceil(sqrt(n));
// l decomposeitera=0;
// ll prod=1;
// for (l i = 0; i < n; i++) {
// /* code */
// prod=((prod*A[i]));
// if(i+1%blocksize==0) {
// sqrtdecompose[decomposeitera++]=prod;
// prod=1;
// }
// }
// }
// ll ans(l Li,l Ri,ll A[],ll p,l n,ll sqrtdecompose[]){
// l blocksize=(l)ceil(sqrt(n));
// // int blockno=Li/blocksize;
// ll prod=1;
// //case 1 starting case handle alsos true when itis not overlapping any block completely
// while(Li%blocksize!=0&&Li<=Ri){
// prod=((prod)*A[Li])%p;//add %p here
// Li++;
// }
// // prod%=p; case 2 for complete overlapping
// while(Li+blocksize<=Ri){
// prod=((prod)*((sqrtdecompose[Li/blocksize])))%p;
// Li+=blocksize;
// }
// // case3 remainig n unoverlapped elements
// while(Li<=Ri) {
// prod=((prod)*(A[Li]))%p;Li++;//add %p here
// }
// return prod;
// }
// 1 approach of the precomputing with theu se of an GLOBAL LOOKUP MATRIX OF SIZE MAX MAX...
// void precomputing(ll A[],l n,ll p){
// l i;
// for (l j= 0; j < (l)log(n); ++j)
// {
// i=0;
// /* code */
// while(i<n)
// {
// /* code */
// if(j==0) lookup[i][j]=i;
// else {
// lookup[i][j]=((lookup[i][j-1]%p)*(lookup[i + (1<<(j-1))][j-1])%p)%p;
// }
// i++;
// }
// }
// }
    /*
    Author: Ishmeet Dosanjh
    Date of Created: 1/12/17
    Version: 0.1 
    */
     
    #pragma comment(linker, "/stack:20000000")
    #pragma GCC optimize("Ofast")
    #pragma GCC target("sse,sse2,sse3,ssse3,sse4,popcnt,abm,mmx,avx,tune=native")
     
    #define _CRT_SECURE_NO_WARNINGS
    #include  <climits>
    # include <iostream>
    # include <cmath>
    # include <algorithm>
    # include <stdio.h>
    # include <cstdint>
    # include <cstring>
    # include <string>
    # include <cstdlib>
    # include <vector>
    # include <bitset>
    # include <map>
    # include <queue>
    # include <ctime>
    # include <stack>
    # include <set>
    # include <list>
    # include <random>
    # include <deque>
    # include <functional>
    # include <iomanip>
    # include <sstream>
    # include <fstream>
    # include <complex>
    # include <numeric>
    # include <immintrin.h>
    # include <cassert>
    # include <array>
    # include <tuple>
    // #include <unordered_set> i ngcc 6.6
    using namespace std;
     
    // Let's define unordered map
    # ifdef __GNUC__
    # if __cplusplus > 199711L
    # include <unordered_set>
    # include <unordered_map>
    # else
    # include <tr1/unordered_map>
    # include <tr1/unordered_set>
    using namespace tr1;
    # endif
    # else
    # include <unordered_map>
    # include <unordered_set>
    # endif
     
    #define VA_NUM_ARGS(...) VA_NUM_ARGS_IMPL_((0,__VA_ARGS__, 6,5,4,3,2,1))
    #define VA_NUM_ARGS_IMPL_(tuple) VA_NUM_ARGS_IMPL tuple
    #define VA_NUM_ARGS_IMPL(_0,_1,_2,_3,_4,_5,_6,N,...) N
    #define macro_dispatcher(macro, ...) macro_dispatcher_(macro, VA_NUM_ARGS(__VA_ARGS__))
    #define macro_dispatcher_(macro, nargs) macro_dispatcher__(macro, nargs)
    #define macro_dispatcher__(macro, nargs) macro_dispatcher___(macro, nargs)
    #define macro_dispatcher___(macro, nargs) macro ## nargs
    #define DBN1(a)           cerr<<#a<<"="<<(a)<<"\n"
    #define DBN2(a,b)         cerr<<#a<<"="<<(a)<<", "<<#b<<"="<<(b)<<"\n"
    #define DBN3(a,b,c)       cerr<<#a<<"="<<(a)<<", "<<#b<<"="<<(b)<<", "<<#c<<"="<<(c)<<"\n"
    #define DBN4(a,b,c,d)     cerr<<#a<<"="<<(a)<<", "<<#b<<"="<<(b)<<", "<<#c<<"="<<(c)<<", "<<#d<<"="<<(d)<<"\n"
    #define DBN5(a,b,c,d,e)   cerr<<#a<<"="<<(a)<<", "<<#b<<"="<<(b)<<", "<<#c<<"="<<(c)<<", "<<#d<<"="<<(d)<<", "<<#e<<"="<<(e)<<"\n"
    #define DBN6(a,b,c,d,e,f) cerr<<#a<<"="<<(a)<<", "<<#b<<"="<<(b)<<", "<<#c<<"="<<(c)<<", "<<#d<<"="<<(d)<<", "<<#e<<"="<<(e)<<", "<<#f<<"="<<(f)<<"\n"
    #define DBN(...) macro_dispatcher(DBN, __VA_ARGS__)(__VA_ARGS__)
    #define DA(a,n) cerr<<#a<<"=["; printarray(a,n); cerr<<"]\n"
    #define DAR(a,n,s) cerr<<#a<<"["<<s<<"-"<<n-1<<"]=["; printarray(a,n,s); cerr<<"]\n"
     
    #ifdef _MSC_VER
    #define PREFETCH(ptr, rw, level) ((void)0)
    #else
    #define PREFETCH(ptr, rw, level) __builtin_prefetch(ptr, rw, level)
    #endif
     
    #ifdef LOCAL
    #define CURTIME() cerr << clock() * 1.0 / CLOCKS_PER_SEC << endl
    #else
    #define CURTIME()
    #endif
    #define pb push_back
    #define mp make_pair
    typedef long long ll;
    typedef unsigned int uint;
    typedef unsigned long long ull;
    typedef double d;
    typedef float f;
    typedef pair<int, int> pii;
    typedef pair<long long, long long> pll;
    typedef vector<int> vi;
    typedef vector<long long> vll;
    typedef int itn;
    typedef long l;
    /***************************************************************/
    // TEMPLATE DECLARATIONS 
    template<class T1, class T2, class T3>
    struct triple{ T1 a; T2 b; T3 c; triple() : a(T1()), b(T2()), c(T3()) {}; triple(T1 _a, T2 _b, T3 _c) :a(_a), b(_b), c(_c){} };
    template<class T1, class T2, class T3>
    bool operator<(const triple<T1,T2,T3>&t1,const triple<T1,T2,T3>&t2){if(t1.a!=t2.a)return t1.a<t2.a;else if(t1.b!=t2.b)return t1.b<t2.b;else return t1.c<t2.c;}
    template<class T1, class T2, class T3>
    bool operator>(const triple<T1,T2,T3>&t1,const triple<T1,T2,T3>&t2){if(t1.a!=t2.a)return t1.a>t2.a;else if(t1.b!=t2.b)return t1.b>t2.b;else return t1.c>t2.c;}
    #define tri triple<int,int,int>
    #define trll triple<ll,ll,ll>
     
     
    //for 1 based arrays 
     
    #define FI2(n) for(int i=1;i<=(n);++i)
    #define FJ2(n) for(int j=1;j<=(n);++j)
    #define FK2(n) for(int k=1;k<=(n);++k)
    //for 0 based indexed arrays 
    #define FI(n) for(long i=0;i<(n);i++)
    #define FJ(n) for(long long j=0;j<(n);j++)
    #define FK(n) for(int k=0;k<(n);++k)
    #define FL(n) for(int l=0;l<(n);++l)
    #define FQ(n) for(int q=0;q<(n);++q)
    #define FOR(i,a,b) for(int i = (a), __e = (int) (b); i < __e; ++i)
    #define all(a) std::begin(a), std::end(a)
    #define reunique(v) v.resize(std::unique(v.begin(), v.end()) - v.begin())
     
    #define sqr(x) ((x) * (x))
    #define sqrt(x) sqrt(1.0 * (x))
    #define pow(x, n) pow(1.0 * (x), n)
     
    #define COMPARE(obj) [&](const std::decay_t<decltype(obj)>& a, const std::decay_t<decltype(obj)>& b)
    #define COMPARE_BY(obj, field) [&](const std::decay_t<decltype(obj)>& a, const std::decay_t<decltype(obj)>& b) { return a.field < b.field; }
     
    #define checkbit(n, b) (((n) >> (b)) & 1)
    #define setbit(n, b) ((n) | (static_cast<std::decay_t<decltype(n)>>(1) << (b)))
    #define removebit(n, b) ((n) & ~(static_cast<std::decay_t<decltype(n)>>(1) << (b)))
    #define flipbit(n, b) ((n) ^ (static_cast<std::decay_t<decltype(n)>>(1) << (b)))
    inline int countBits(uint v){v=v-((v>>1)&0x55555555);v=(v&0x33333333)+((v>>2)&0x33333333);return((v+(v>>4)&0xF0F0F0F)*0x1010101)>>24;}
    inline int countBits(ull v){uint t=v>>32;uint p=(v & ((1ULL << 32) - 1)); return countBits(t) + countBits(p); }
    inline int countBits(ll v){return countBits((ull)v); }
    inline int countBits(int v){return countBits((uint)v); }
    unsigned int reverseBits(uint x){ x = (((x & 0xaaaaaaaa) >> 1) | ((x & 0x55555555) << 1)); x = (((x & 0xcccccccc) >> 2) | ((x & 0x33333333) << 2)); x = (((x & 0xf0f0f0f0) >> 4) | ((x & 0x0f0f0f0f) << 4)); x = (((x & 0xff00ff00) >> 8) | ((x & 0x00ff00ff) << 8)); return((x >> 16) | (x << 16)); }
    template<class T> inline int sign(T x){ return x > 0 ? 1 : x < 0 ? -1 : 0; }
    inline bool isPowerOfTwo(int x){ return (x != 0 && (x&(x - 1)) == 0); }
    constexpr ll power(ll x, int p) { return p == 0 ? 1 : (x * power(x, p - 1)); }
    template<class T1, class T2, class T3> T1 inline clamp(T1 x, const T2& a, const T3& b) { if (x < a) return a; else if (x > b) return b; else return x; }
    unsigned long long rdtsc() { unsigned long long ret = 0;
    #ifdef __clang__
        return __builtin_readcyclecounter();
    #endif
    #ifndef _MSC_VER
        asm volatile("rdtsc" : "=A" (ret) : :);
    #endif
        return ret; }
    // Fast IO ********************************************************************************************************
    const int __BS = 4096;
    static char __bur[__BS + 16], *__er = __bur + __BS, *__ir = __er;
    template<class T = int> T readInt() {
        auto c = [&]() { if (__ir == __er) std::fill(__bur, __bur + __BS, 0), cin.read(__bur, __BS), __ir = __bur; };
        c(); while (*__ir && (*__ir < '0' || *__ir > '9') && *__ir != '-') ++__ir; c();
        bool m = false; if (*__ir == '-') ++__ir, c(), m = true;
        T r = 0; while (*__ir >= '0' && *__ir <= '9') r = r * 10 + *__ir - '0', ++__ir, c();
        ++__ir; return m ? -r : r;
    }
    static char __buw[__BS + 20], *__iw = __buw, *__ew = __buw + __BS;
    template<class T>
    void writeInt(T x, char endc = '\n') {
        if (x < 0) *__iw++ = '-', x = -x; if (x == 0) *__iw++ = '0';
        char* s = __iw;
        while (x) { T t = x / 10; char c = x - 10 * t + '0'; *__iw++ = c; x = t; }
        char* f = __iw - 1; while (s < f) swap(*s, *f), ++s, --f;
        if (__iw > __ew) cout.write(__buw, __iw - __buw), __iw = __buw;
        *__iw++ = endc;
    }
    template<class T>
    void writeStr(const T& str) {
        int i = 0; while (str[i]) { *__iw++ = str[i++]; if (__iw > __ew) cout.write(__buw, __iw - __buw), __iw = __buw; }
    }
    struct __FL__ { ~__FL__() { if (__iw != __buw) cout.write(__buw, __iw - __buw); } };
    static __FL__ __flushVar__;
     
    //STL output *****************************************************************************************************
    #define TT1 template<class T>
    #define TT1T2 template<class T1, class T2>
    #define TT1T2T3 template<class T1, class T2, class T3>
    TT1T2 ostream& operator << (ostream& os, const pair<T1, T2>& p);
    TT1 ostream& operator << (ostream& os, const vector<T>& v);
    TT1T2 ostream& operator << (ostream& os, const set<T1, T2>&v);
    TT1T2 ostream& operator << (ostream& os, const multiset<T1, T2>&v);
    TT1T2 ostream& operator << (ostream& os, priority_queue<T1, T2> v);
    TT1T2T3 ostream& operator << (ostream& os, const map<T1, T2, T3>& v);
    TT1T2T3 ostream& operator << (ostream& os, const multimap<T1, T2, T3>& v);
    TT1T2T3 ostream& operator << (ostream& os, const triple<T1, T2, T3>& t);
    template<class T, size_t N> ostream& operator << (ostream& os, const array<T, N>& v);
    TT1T2 ostream& operator << (ostream& os, const pair<T1, T2>& p){ return os <<"("<<p.first<<", "<< p.second<<")"; }
    TT1 ostream& operator << (ostream& os, const vector<T>& v){       bool f=1;os<<"[";for(auto& i : v) { if (!f)os << ", ";os<<i;f=0;}return os << "]"; }
    template<class T, size_t N> ostream& operator << (ostream& os, const array<T, N>& v) {     bool f=1;os<<"[";for(auto& i : v) { if (!f)os << ", ";os<<i;f=0;}return os << "]"; }
    TT1T2 ostream& operator << (ostream& os, const set<T1, T2>&v){    bool f=1;os<<"[";for(auto& i : v) { if (!f)os << ", ";os<<i;f=0;}return os << "]"; }
    TT1T2 ostream& operator << (ostream& os, const multiset<T1,T2>&v){bool f=1;os<<"[";for(auto& i : v) { if (!f)os << ", ";os<<i;f=0;}return os << "]"; }
    TT1T2T3 ostream& operator << (ostream& os, const map<T1,T2,T3>& v){ bool f = 1; os << "["; for (auto& ii : v) { if (!f)os << ", "; os << "(" << ii.first << " -> " << ii.second << ") "; f = 0; }return os << "]"; }
    TT1T2 ostream& operator << (ostream& os, const multimap<T1, T2>& v){ bool f = 1; os << "["; for (auto& ii : v) { if (!f)os << ", "; os << "(" << ii.first << " -> " << ii.second << ") "; f = 0; }return os << "]"; }
    TT1T2 ostream& operator << (ostream& os, priority_queue<T1, T2> v) { bool f = 1; os << "["; while (!v.empty()) { auto x = v.top(); v.pop(); if (!f) os << ", "; f = 0; os << x; } return os << "]"; }
    TT1T2T3 ostream& operator << (ostream& os, const triple<T1, T2, T3>& t){ return os << "(" << t.a << ", " << t.b << ", " << t.c << ")"; }
    TT1T2 void printarray(const T1& a, T2 sz, T2 beg = 0){ for (T2 i = beg; i<sz; i++) cout << a[i] << " "; cout << endl; }
     
    //STL input *****************************************************************************************************
    TT1T2T3 inline istream& operator >> (istream& os, triple<T1, T2, T3>& t);
    TT1T2 inline istream& operator >> (istream& os, pair<T1, T2>& p) { return os >> p.first >> p.second; }
    TT1 inline istream& operator >> (istream& os, vector<T>& v) {
        if (v.size()) for (T& t : v) os >> t; else {
            string s; T obj; while (s.empty()) {getline(os, s); if (!os) return os;}
            stringstream ss(s); while (ss >> obj) v.push_back(obj);
        }
        return os;
    }
    TT1T2T3 inline istream& operator >> (istream& os, triple<T1, T2, T3>& t) { return os >> t.a >> t.b >> t.c; }
     
    //Pair magic *****************************************************************************************************
    #define PT1T2 pair<T1, T2>
    TT1T2 inline PT1T2 operator+(const PT1T2 &p1 , const PT1T2 &p2) { return PT1T2(p1.first + p2.first, p1.second + p2.second); }
    TT1T2 inline PT1T2& operator+=(PT1T2 &p1 , const PT1T2 &p2) { p1.first += p2.first, p1.second += p2.second; return p1; }
    TT1T2 inline PT1T2 operator-(const PT1T2 &p1 , const PT1T2 &p2) { return PT1T2(p1.first - p2.first, p1.second - p2.second); }
    TT1T2 inline PT1T2& operator-=(PT1T2 &p1 , const PT1T2 &p2) { p1.first -= p2.first, p1.second -= p2.second; return p1; }
     
    #undef TT1
    #undef TT1T2
    #undef TT1T2T3
     
    #define FREIN(FILE) freopen(FILE, "rt", stdin)
    #define FREOUT(FILE) freopen(FILE, "wt", stdout)
    #ifdef LOCAL
    #define BEGIN_PROFILE(idx, name) int profileIdx = idx; profileName[profileIdx] = name; totalTime[profileIdx] -= rdtsc() / 1e3;
    #define END_PROFILE totalTime[profileIdx] += rdtsc() / 1e3; totalCount[profileIdx]++;
    #else
    #define BEGIN_PROFILE(idx, name)
    #define END_PROFILE
    #endif
     
    template<class T> inline void normmod(T &x, T m) { x %= m; if (x < 0) x += m; }
    template<class T1, class T2> inline T2 summodfast(T1 x, T1 y, T2 m) { T2 res = x + y; if (res >= m) res -= m; return res; }
    template<class T1, class T2, class T3> inline void addmodfast(T1 &x, T2 y, T3 m) { x += y; if (x >= m) x -= m; }
    template<class T1, class T2, class T3> inline void submodfast(T1 &x, T2 y, T3 m) { x -= y; if (x < 0) x += m; }
    #if INTPTR_MAX == INT32_MAX or !defined(__SIZEOF_INT128__)
    inline ll mulmod(ll x, ll n, ll m){ ll r = 0; normmod(x, m); normmod(n, m); while (n) { if (n & 1) r += x; x += x; if (r >= m) r -= m; if (x >= m) x -= m; n /= 2; } return r; }
    #else
    using int128 = __int128;
    inline ll mulmod(ll x, ll n, ll m){ return __int128(x) * n % m; }
    #endif
    inline ll powmod(ll x, ll n, ll m){ ll r = 1; normmod(x, m); while (n){ if (n & 1)r = (r*x) % m; x = (x*x) % m; n /= 2; }return r; }
    inline ll powmulmod(ll x, ll n, ll m) { ll res = 1; normmod(x, m); while (n){ if (n & 1)res = mulmod(res, x, m); x = mulmod(x, x, m); n /= 2; } return res; }
    template<class T> inline T gcd(T a, T b) { while (b) { a %= b; T t = a; a = b; b = t; } return a; }
    inline ll lcm(ll a, ll b){ return a / gcd(a, b) * b; }
    template<class T> inline T gcd(T a, T b, T c){ return gcd(gcd(a, b), c); }
    ll gcdex(ll a, ll b, ll& x, ll& y) {
        if (!a) { x = 0; y = 1; return b; }
        ll y1; ll d = gcdex(b % a, a, y, y1); x = y1 - (b / a) * y;
        return d;
    }
    template<class T> bool isPrime(T x) { if (x <= 4 || x % 2 == 0 || x % 3 == 0) return x == 2 || x == 3;
        for (T i = 5; i * i <= x; i += 6) if (x % i == 0 || x % (i + 2) == 0) return 0; return 1; }
    bool millerRabin(long long n) {
        if (n <= 1000) return isPrime(n);
        long long s = n - 1; int t = 0; while (s % 2 == 0) s /= 2, ++t;
        for (int a : {2, 325, 9375, 28178, 450775, 9780504, 1795265022}) { if (!(a %= n)) return true;
            long long f = powmulmod(a, s, n); if (f == 1 || f == n - 1) continue;
            for (int i = 1; i < t; ++i) if ((f = mulmod(f, f, n)) == n - 1) goto nextp;
            return false; nextp:;
        } return true;
    }
     
     
     
    //some modulus and gcd type functions  
     
     
    const int mod = 1e9 + 7 ;
    ll powmod(ll a,ll b) {ll res=1;if(a>=mod)a%=mod;for(;b;b>>=1){if(b&1)res=res*a;if(res>=mod)res%=mod;a=a*a;if(a>=mod)a%=mod;}return res;}
    ll gcd(ll a , ll b){return a==0?b:gcd(b%a,a);}
    // Useful constants
     
     int some_primes[7] = {24443, 100271, 1000003, 1000333, 5000321, 98765431, 1000000123};
     
     
     
     
    #define T9          1000000000
    #define T18         1000000000000000000LL
    #define INF         1011111111
    #define LLINF       1000111000111000111LL
     
    #define EPS         (double)1e-10
    #define PI          3.14159265358979323846264
    #define link        asaxlajrewqwe
    #define rank        wahayawehasdakw
    // modulo
    #define mod %
    #define NUM  1000000007
    #define NUM1 1000000009
    //scanf type macros 
    #define s(n) scanf("%d", &n)
    #define sl(n) scanf("%ld", &n)
    #define sl3(n1,n2,n3) scanf("%lld %lld %lld ", &n1, &n2, &n3)
    #define sl4(n1,n2,n3,n4) scanf("%ld %ld %ld %ld", &n1, &n2, &n3, &n4)
    #define sll(n) scanf("%I64d", &n)
    #define sll2(n) scanf("%lld", &n)
    //printf type macros 
    #define p(n) printf("%d\n", n)
    #define pl(n) printf("%ld\n",n)
    #define pl3(n1,n2,n3) printf("%lld %lld %lld\n ", n1, n2, n3)
    #define pl4(n1,n2,n3,n4) printf("%ld %ld %ld %ld\n ", n1, n2, n3, n4)
    #define pll(n) printf("%I64d\n",n)
    #define pll2(n) printf("%lld\n",n)
     
     
        //*************************************************************************************
    int32_t solve();
    
// C function for extended Euclidean Algorithm
ll gcdExtended(ll a, ll b, ll *x, ll *y);
 
// Function to find modulo inverse of a
ll modInverse(ll a, ll m)
{
    ll x, y;
    ll g = gcdExtended(a, m, &x, &y);
    if (g != 1){}
        // cout << "Inverse doesn't exist";
    else
    {
        // m is added to handle negative x
        ll res = (x%m + m) % m;
        // cout << "Modular multiplicative inverse is " << 
        return res;
    }
}
 
// C function for extended Euclidean Algorithm
ll gcdExtended(ll a, ll b, ll *x, ll *y)
{
    // Base Case
    if (a == 0)
    {
        *x = 0, *y = 1;
        return b;
    }
 
    ll x1, y1; // To store results of recursive call
    ll gcd = gcdExtended(b%a, a, &x1, &y1);
 
    // Update x and y using results of recursive
    // call
    *x = y1 - (b/a) * x1;
    *y = x1;
 
    return gcd;
}
        
     
    int32_t main(int argc, char** argv) {
       
    ios_base::sync_with_stdio(0);cin.tie(0);
    #ifdef LOCAL
              FREIN("input.txt");
              // FREOUT("out.txt");                                                                                                                                               
    #endif
        return solve();
    }
    //red blue ok but i hate palindromes 
    int32_t solve(){
        int t;l jspecial,n,j,q,qi,Li,Ri,prevli,prevri,i;//qi is the query iterator here 
        ll p,x;
        s(t);
        while(t--){
            x=0;
            sl(n),sll2(p),sl(q);
            ll ppA[n];        //prefix product array 
            ll A[n],prod=1;
            FI(n) {sll2(A[i]);prod=(prod*A[i])%p,ppA[i]=prod;}
            
            //for 2 d matrix storing 
            // for (i = 0; i < n; i++) {
            //     /* code */
            //     prod=A[i]%p;
            //     ppA[i][i]=(prod%p);
            // for (j = i+1; j < n; j++) {
            //     /* code */
            //     prod=(prod%p*A[j]%p)%p;
            //     ppA[i][j]=(prod)%p;
            // }
            // prod=1;
            // }
            
            
            
            // for (i = 0; i < n; i++) {
            //     /* code */
                for (j = 0; j < n; j++) {
                    /* code */
                    cout<<ppA[j]<<" ";
                }
                cout<<"\n";
            // }
            
            
            
            
                        
            
            l B[(ll)floor((double)q/(double)64)+2];
            FJ(sizeof(B)/sizeof(B[0])) sl(B[j]);
            // ll sqrtdecompose[(l)ceil(sqrt(n))];
            // builddecompostion(A,p,n,sqrtdecompose);
            // precomputing(A,n,p);
            // l colsize=(l)floor(log(n));
            // ll lookup[n][colsize];
            //sparse table approach preprocessing O(nlogn) query O(1) 
                
            // for (i = 0; i < n; i++) lookup[i][0]=A[i];
            // for (j = 1; (1<<j)<= n; j++)//till logn 
            //     /* code */
            //     for (i = 0; i <= n-(1<<j); i++) {
            //         /* code */
            //         //range 2 ki power hai ya nhi it is an part of an query
            //         lookup[i][j]=((lookup[i][j-1]%p)*((lookup[i+(1<<(j-1))][j-1])%p))%p;
            //     }
            // } //lookup matrix for all possible subarrays of length pow(2,j) for all possible values of j as 0,1,2,3,4,5 up till log(n)
                
             
            //taran rakha                              
            
            for(qi=0;qi<(q);qi++) {
              if(qi%64==0) //here always first it will executes 
             {
                 if(qi==0) x=0;
                 Li = (B[qi/64]  + x)%n, Ri = (B[(qi/64)+1]  + x)%n;
             }
                            
              else {Li = (prevli + x)%n, Ri = (prevri + x)%n;}
              
                        if(Li>Ri) swap(Li,Ri);//O(1) time operation 
                    //   x=(lookup[Li][Ri]+1)%p;
                       //(ans(Li,Ri,A,p,n,sqrtdecompose)
                    //     jspecial=(l)log2(Ri-Li+1);      
                    //     if(jspecial%2==0) {x=(lookup[Li][jspecial]+1)%p;}
                    //   else {
                    //       x=(((lookup[Li][jspecial]+lookup[R-(1<<(jspecial))+1][jspecial])/2)+1)%p;
                    //   }
                       
                    //   if(ppA[Li]!=0)
                        // x=((((ppA[Ri])/ppA[Li-1]))+1)%p;
                        // std::cout << ppA[Li][Ri-Li] << std::endl;
                        
                        
        // <---                    @taran check from here --->
                        
                        
                        x=(((ppA[Ri])*(modInverse(ppA[Li-1],p)))%p+1)%p;
                        //   else  
                                                                       
                                                                       
                       
                        prevli=Li,prevri=Ri;
                
            }
                
            
                
             pll2(x%p);
      
        }
        
        return 0;
    } 
    
    
    
    
    //sq root decompostion tehcnique used 
    
    
    
    // #define MAX 1000000  
    // ll lookup[MAX][MAX]; 
    // void builddecompostion(ll A[],ll p,l n,ll sqrtdecompose[]){
    //     l blocksize=(l)ceil(sqrt(n));
    //     l decomposeitera=0;
    //     ll prod=1;
    //     for (l i = 0; i < n; i++) {
    //             /* code */
    //         prod=((prod*A[i]));
    //         if(i+1%blocksize==0) {
    //                 sqrtdecompose[decomposeitera++]=prod;
    //                 prod=1;
    //         }
            
    //     }    
    // }
        
        
    // ll ans(l Li,l Ri,ll A[],ll p,l n,ll sqrtdecompose[]){
        
    //     l blocksize=(l)ceil(sqrt(n));
    //     // int blockno=Li/blocksize;
    //     ll prod=1;
    //     //case 1 starting case handle alsos true when itis not overlapping any  block  completely 
    //     while(Li%blocksize!=0&&Li<=Ri){
    //         prod=((prod)*A[Li])%p;//add %p here 
    //         Li++;
    //     }
    //     // prod%=p; case 2 for complete overlapping 
    //     while(Li+blocksize<=Ri){
    //         prod=((prod)*((sqrtdecompose[Li/blocksize])))%p;
    //         Li+=blocksize; 
    //     }    
    //     // case3 remainig n unoverlapped elements 
    //     while(Li<=Ri)    {
    //         prod=((prod)*(A[Li]))%p;Li++;//add %p here 
    //     }
        
    //     return prod;
        
    // }
     
        
// 1 approach of the precomputing with theu se of an GLOBAL LOOKUP MATRIX OF SIZE MAX MAX...            
// void precomputing(ll A[],l n,ll p){
//     l i;
//     for (l j= 0; j < (l)log(n); ++j)
//     {
//         i=0;
//         /* code */
//         while(i<n)
//         {
//             /* code */
//             if(j==0) lookup[i][j]=i;
//             else {
//                 lookup[i][j]=((lookup[i][j-1]%p)*(lookup[i + (1<<(j-1))][j-1])%p)%p;
//             }
//             i++; 
//         }
//     }

// }    