wiki:Sting
---------------------------------------------
   4 Processor run, global<128,128,128>
   for 100 time steps
main timer : (real:0:1:8,user:0:1:6,sys:0:0:1)[clk:6860]
	loop : (real:0:0:35,user:0:0:34,sys:0:0:1)[clk:3586]	(100 calls X 3.586000e+01)
	FFT timer : (real:0:0:54,user:0:0:53,sys:0:0:0)[clk:5402]
		planification time : (real:0:0:31,user:0:0:31,sys:0:0:0)[clk:3179]
		FFT and transposition time : (real:0:0:22,user:0:0:21,sys:0:0:0)[clk:2223]	(509 calls X 4.367387e+00)
			FFT only : (real:0:0:14,user:0:0:13,sys:0:0:0)[clk:1429]	(2545 calls X 5.614931e-01)
			Transposition only : (real:0:0:6,user:0:0:6,sys:0:0:0)[clk:611]	(1832 calls X 3.335153e-01)
	azur::array timer root : (real:0:0:7,user:0:0:7,sys:0:0:0)[clk:774]
		view = expr : (real:0:0:7,user:0:0:7,sys:0:0:0)[clk:774]	(2538 calls X 3.049645e-01)
			fftw3<dbl> id= dbl : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:79]	(510 calls X 1.549020e-01)
			fftw3<dbl> /= dbl : (real:0:0:0,user:0:0:1,sys:0:0:0)[clk:99]	(612 calls X 1.617647e-01)
			fftw4<dbl> id= dbl : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:1]	(1 calls X 1.000000e+00)
			fftw3<dbl> id= fftw3<dbl> : (real:0:0:1,user:0:0:1,sys:0:0:0)[clk:119]	(606 calls X 1.963696e-01)
			fftw3<dbl> *= dbl : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:1]	(3 calls X 3.333333e-01)
			fftw4<cdbl> id= fftw4<cdbl> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:94]	(202 calls X 4.653465e-01)
			fftw4<dbl> id= fftw4<dbl> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:50]	(103 calls X 4.854369e-01)
			fftw4<cdbl> id= (s2v<basic3<dbl>> * ((fftw4<cdbl> * dbl) + fftw4<cdbl>)) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:1]	(1 calls X 1.000000e+00)
			fftw4<cdbl> id= (s2v<basic3<dbl>> * ((fftw4<cdbl> * dbl) + fftw4<cdbl>)) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:1]	(1 calls X 1.000000e+00)
			fftw4<cdbl> id= (s2v<basic3<dbl>> * (fftw4<cdbl> * dbl)) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:1]	(1 calls X 1.000000e+00)
			fftw4<cdbl> *= s2v<basic3<dbl>> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:1]	(1 calls X 1.000000e+00)
			fftw4<cdbl> += fftw4<cdbl> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:0]	(1 calls X 0.000000e+00)
			fftw4<cdbl> id= ((fftw4<cdbl> * s2v<basic3<dbl>>) + (s2v<basic3<dbl>> * (fftw4<cdbl> * dbl))) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:1]	(1 calls X 1.000000e+00)
			fftw4<cdbl> id= ((fftw4<cdbl> * dbl) * s2v<basic3<dbl>>) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:60]	(99 calls X 6.060606e-01)
			fftw4<cdbl> -= fftw4<cdbl> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:54]	(99 calls X 5.454546e-01)
			fftw4<cdbl> -= ((fftw4<cdbl> * dbl) * s2v<basic3<dbl>>) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:71]	(99 calls X 7.171717e-01)
			fftw4<cdbl> id= (s2v<basic3<dbl>> swp(*) (fftw4<cdbl> + (fftw4<cdbl> * dbl))) : (real:0:0:1,user:0:0:1,sys:0:0:0)[clk:139]	(198 calls X 7.020202e-01)
	cubby::field timer root : (real:0:0:12,user:0:0:13,sys:0:0:0)[clk:1299]
		scalar::transpose_blocks_when_received : (real:0:0:6,user:0:0:7,sys:0:0:0)[clk:693]	(3054 calls X 2.269155e-01)
			scalar::copy_transposed : (real:0:0:2,user:0:0:2,sys:0:0:0)[clk:202]	(6108 calls X 3.307138e-02)
		vector::in_place_curl : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:85]	(202 calls X 4.207921e-01)
		scalar::local_energy : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:8]	(66 calls X 1.212121e-01)
		vector::vec_prod : (real:0:0:1,user:0:0:1,sys:0:0:0)[clk:112]	(202 calls X 5.544555e-01)
		vector::project : (real:0:0:1,user:0:0:1,sys:0:0:0)[clk:173]	(101 calls X 1.712871e+00)
		scalar::dealias : (real:0:0:2,user:0:0:2,sys:0:0:0)[clk:225]	(606 calls X 3.712871e-01)
 ---------------------------------------------
   8 Processor run, global<128,128,128>
   for 100 time steps
main timer : (real:0:0:47,user:0:0:45,sys:0:0:1)[clk:4746]
	loop : (real:0:0:23,user:0:0:22,sys:0:0:1)[clk:2370]	(100 calls X 2.370000e+01)
	FFT timer : (real:0:0:37,user:0:0:36,sys:0:0:0)[clk:3714]
		planification time : (real:0:0:23,user:0:0:22,sys:0:0:0)[clk:2301]
		FFT and transposition time : (real:0:0:14,user:0:0:13,sys:0:0:0)[clk:1413]	(509 calls X 2.776031e+00)
			FFT only : (real:0:0:6,user:0:0:7,sys:0:0:0)[clk:683]	(2545 calls X 2.683693e-01)
			Transposition only : (real:0:0:5,user:0:0:5,sys:0:0:0)[clk:587]	(1832 calls X 3.204148e-01)
	azur::array timer root : (real:0:0:6,user:0:0:5,sys:0:0:0)[clk:646]
		view = expr : (real:0:0:6,user:0:0:5,sys:0:0:0)[clk:645]	(2538 calls X 2.541371e-01)
			fftw3<dbl> id= dbl : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:56]	(510 calls X 1.098039e-01)
			fftw3<dbl> /= dbl : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:73]	(612 calls X 1.192810e-01)
			fftw4<dbl> id= dbl : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:0]	(1 calls X 0.000000e+00)
			fftw3<dbl> id= fftw3<dbl> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:91]	(606 calls X 1.501650e-01)
			fftw3<dbl> *= dbl : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:0]	(3 calls X 0.000000e+00)
			fftw4<cdbl> id= fftw4<cdbl> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:92]	(202 calls X 4.554456e-01)
			fftw4<dbl> id= fftw4<dbl> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:58]	(103 calls X 5.631068e-01)
			fftw4<cdbl> id= (s2v<basic3<dbl>> * ((fftw4<cdbl> * dbl) + fftw4<cdbl>)) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:1]	(1 calls X 1.000000e+00)
			fftw4<cdbl> id= (s2v<basic3<dbl>> * ((fftw4<cdbl> * dbl) + fftw4<cdbl>)) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:0]	(1 calls X 0.000000e+00)
			fftw4<cdbl> id= (s2v<basic3<dbl>> * (fftw4<cdbl> * dbl)) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:0]	(1 calls X 0.000000e+00)
			fftw4<cdbl> *= s2v<basic3<dbl>> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:1]	(1 calls X 1.000000e+00)
			fftw4<cdbl> += fftw4<cdbl> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:0]	(1 calls X 0.000000e+00)
			fftw4<cdbl> id= ((fftw4<cdbl> * s2v<basic3<dbl>>) + (s2v<basic3<dbl>> * (fftw4<cdbl> * dbl))) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:1]	(1 calls X 1.000000e+00)
			fftw4<cdbl> id= ((fftw4<cdbl> * dbl) * s2v<basic3<dbl>>) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:57]	(99 calls X 5.757576e-01)
			fftw4<cdbl> -= fftw4<cdbl> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:51]	(99 calls X 5.151515e-01)
			fftw4<cdbl> -= ((fftw4<cdbl> * dbl) * s2v<basic3<dbl>>) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:50]	(99 calls X 5.050505e-01)
			fftw4<cdbl> id= (s2v<basic3<dbl>> swp(*) (fftw4<cdbl> + (fftw4<cdbl> * dbl))) : (real:0:0:1,user:0:0:1,sys:0:0:0)[clk:110]	(198 calls X 5.555556e-01)
	cubby::field timer root : (real:0:0:9,user:0:0:9,sys:0:0:0)[clk:998]
		scalar::transpose_blocks_when_received : (real:0:0:6,user:0:0:6,sys:0:0:0)[clk:654]	(3054 calls X 2.141454e-01)
			scalar::copy_transposed : (real:0:0:1,user:0:0:1,sys:0:0:0)[clk:165]	(12216 calls X 1.350688e-02)
		vector::in_place_curl : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:58]	(202 calls X 2.871287e-01)
		scalar::local_energy : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:3]	(66 calls X 4.545455e-02)
		vector::vec_prod : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:92]	(202 calls X 4.554456e-01)
		vector::project : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:83]	(101 calls X 8.217822e-01)
		scalar::dealias : (real:0:0:1,user:0:0:1,sys:0:0:0)[clk:107]	(606 calls X 1.765677e-01)

 ---------------------------------------------
   8 Processor run, global<256,256,256>
   for 100 time steps
main timer : (real:0:5:53,user:0:5:41,sys:0:0:11)[clk:35314]
	loop : (real:0:3:21,user:0:3:10,sys:0:0:10)[clk:20150]	(100 calls X 2.015000e+02)
	FFT timer : (real:0:4:31,user:0:4:28,sys:0:0:3)[clk:27168]
		planification time : (real:0:2:26,user:0:2:25,sys:0:0:0)[clk:14643]
		FFT and transposition time : (real:0:2:5,user:0:2:2,sys:0:0:2)[clk:12524]	(509 calls X 2.460511e+01)
			FFT only : (real:0:1:12,user:0:1:11,sys:0:0:0)[clk:7221]	(2545 calls X 2.837328e+00)
			Transposition only : (real:0:0:42,user:0:0:39,sys:0:0:2)[clk:4205]	(1832 calls X 2.295306e+00)
	azur::array timer root : (real:0:0:48,user:0:0:45,sys:0:0:3)[clk:4859]
		view = expr : (real:0:0:48,user:0:0:45,sys:0:0:3)[clk:4858]	(2538 calls X 1.914106e+00)
			fftw3<dbl> id= dbl : (real:0:0:4,user:0:0:1,sys:0:0:3)[clk:466]	(510 calls X 9.137255e-01)
			fftw3<dbl> /= dbl : (real:0:0:4,user:0:0:4,sys:0:0:0)[clk:466]	(612 calls X 7.614379e-01)
			fftw4<dbl> id= dbl : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:2]	(1 calls X 2.000000e+00)
			fftw3<dbl> id= fftw3<dbl> : (real:0:0:7,user:0:0:7,sys:0:0:0)[clk:729]	(606 calls X 1.202970e+00)
			fftw3<dbl> *= dbl : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:2]	(3 calls X 6.666667e-01)
			fftw4<cdbl> id= fftw4<cdbl> : (real:0:0:7,user:0:0:7,sys:0:0:0)[clk:747]	(202 calls X 3.698020e+00)
			fftw4<dbl> id= fftw4<dbl> : (real:0:0:3,user:0:0:3,sys:0:0:0)[clk:351]	(103 calls X 3.407767e+00)
			fftw4<cdbl> id= (s2v<basic3<dbl>> * ((fftw4<cdbl> * dbl) + fftw4<cdbl>)) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:4]	(1 calls X 4.000000e+00)
			fftw4<cdbl> id= (s2v<basic3<dbl>> * ((fftw4<cdbl> * dbl) + fftw4<cdbl>)) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:4]	(1 calls X 4.000000e+00)
			fftw4<cdbl> id= (s2v<basic3<dbl>> * (fftw4<cdbl> * dbl)) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:5]	(1 calls X 5.000000e+00)
			fftw4<cdbl> *= s2v<basic3<dbl>> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:3]	(1 calls X 3.000000e+00)
			fftw4<cdbl> += fftw4<cdbl> : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:4]	(1 calls X 4.000000e+00)
			fftw4<cdbl> id= ((fftw4<cdbl> * s2v<basic3<dbl>>) + (s2v<basic3<dbl>> * (fftw4<cdbl> * dbl))) : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:5]	(1 calls X 5.000000e+00)
			fftw4<cdbl> id= ((fftw4<cdbl> * dbl) * s2v<basic3<dbl>>) : (real:0:0:4,user:0:0:4,sys:0:0:0)[clk:454]	(99 calls X 4.585859e+00)
			fftw4<cdbl> -= fftw4<cdbl> : (real:0:0:3,user:0:0:3,sys:0:0:0)[clk:365]	(99 calls X 3.686869e+00)
			fftw4<cdbl> -= ((fftw4<cdbl> * dbl) * s2v<basic3<dbl>>) : (real:0:0:4,user:0:0:4,sys:0:0:0)[clk:417]	(99 calls X 4.212121e+00)
			fftw4<cdbl> id= (s2v<basic3<dbl>> swp(*) (fftw4<cdbl> + (fftw4<cdbl> * dbl))) : (real:0:0:8,user:0:0:8,sys:0:0:0)[clk:834]	(198 calls X 4.212121e+00)
	cubby::field timer root : (real:0:1:16,user:0:1:13,sys:0:0:2)[clk:7631]
		scalar::transpose_blocks_when_received : (real:0:0:48,user:0:0:45,sys:0:0:2)[clk:4835]	(3054 calls X 1.583170e+00)
			scalar::copy_transposed : (real:0:0:16,user:0:0:15,sys:0:0:0)[clk:1611]	(12216 calls X 1.318762e-01)
		vector::in_place_curl : (real:0:0:4,user:0:0:4,sys:0:0:0)[clk:480]	(202 calls X 2.376238e+00)
		scalar::local_energy : (real:0:0:0,user:0:0:0,sys:0:0:0)[clk:31]	(66 calls X 4.696970e-01)
		vector::vec_prod : (real:0:0:7,user:0:0:7,sys:0:0:0)[clk:721]	(202 calls X 3.569307e+00)
		vector::project : (real:0:0:6,user:0:0:6,sys:0:0:0)[clk:695]	(101 calls X 6.881188e+00)
		scalar::dealias : (real:0:0:8,user:0:0:8,sys:0:0:0)[clk:869]	(606 calls X 1.433993e+00)

Last modified on Mar 23, 2011 5:06:38 PM