Advertisement
Guest User

Sin Optimization icpc_O3

a guest
Feb 4th, 2014
134
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 12.64 KB | None | 0 0
  1. icpc_O3: file format elf64-x86-64
  2.  
  3.  
  # sin1(double) -- odd polynomial in x, evaluated as a single serial chain in %xmm1.
  # In:  %xmm0 = x.   Out: %xmm0 = result.   Scratch: %xmm1.   No calls, no stack use.
  # Notation: Knn = the double read from address 0x4058nn
  #           (.L_2il0floatpacket.440 + offset); the values are not shown in this listing.
  # NOTE(review): presumably sine-series coefficients, going by the function name --
  #               confirm against the data at 0x405858..0x405888.
  # Value computed, in evaluation order:
  #   p = (x*x)*K60 + K58
  #   p = (p*x)*x + Kc      for Kc = K68, K70, K78, K80, K88 in turn
  #   result = x + ((p*x)*x)*x
  # Every "times x^2" step is two dependent multiplies by x, and every instruction
  # depends on the one before it through %xmm1.
  4. 0000000000401c80 <sin1(double)>:
  5. 401c80: 0f 28 c8 movaps %xmm0,%xmm1  # xmm1 = x (full-register copy; only the low double is used)
  6. 401c83: f2 0f 59 c8 mulsd %xmm0,%xmm1  # xmm1 = x*x
  7. 401c87: f2 0f 59 0d d1 3b 00 mulsd 0x3bd1(%rip),%xmm1 # 405860 <.L_2il0floatpacket.440+0x50>  -- p = (x*x) * K60
  8. 401c8e: 00
  9. 401c8f: f2 0f 58 0d c1 3b 00 addsd 0x3bc1(%rip),%xmm1 # 405858 <.L_2il0floatpacket.440+0x48>  -- p += K58
  10. 401c96: 00
  11. 401c97: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  12. 401c9b: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  13. 401c9f: f2 0f 58 0d c1 3b 00 addsd 0x3bc1(%rip),%xmm1 # 405868 <.L_2il0floatpacket.440+0x58>  -- p += K68
  14. 401ca6: 00
  15. 401ca7: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  16. 401cab: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  17. 401caf: f2 0f 58 0d b9 3b 00 addsd 0x3bb9(%rip),%xmm1 # 405870 <.L_2il0floatpacket.440+0x60>  -- p += K70
  18. 401cb6: 00
  19. 401cb7: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  20. 401cbb: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  21. 401cbf: f2 0f 58 0d b1 3b 00 addsd 0x3bb1(%rip),%xmm1 # 405878 <.L_2il0floatpacket.440+0x68>  -- p += K78
  22. 401cc6: 00
  23. 401cc7: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  24. 401ccb: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  25. 401ccf: f2 0f 58 0d a9 3b 00 addsd 0x3ba9(%rip),%xmm1 # 405880 <.L_2il0floatpacket.440+0x70>  -- p += K80
  26. 401cd6: 00
  27. 401cd7: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  28. 401cdb: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  29. 401cdf: f2 0f 58 0d a1 3b 00 addsd 0x3ba1(%rip),%xmm1 # 405888 <.L_2il0floatpacket.440+0x78>  -- p += K88
  30. 401ce6: 00
  31. 401ce7: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x   (first of three: the final factor is x^3)
  32. 401ceb: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  33. 401cef: f2 0f 59 c8 mulsd %xmm0,%xmm1  # p *= x
  34. 401cf3: f2 0f 58 c1 addsd %xmm1,%xmm0  # xmm0 = x + p
  35. 401cf7: c3 retq
  36. 401cf8: 0f 1f 84 00 00 00 00 nopl 0x0(%rax,%rax,1)  # filler after retq, up to the next function at 401d00
  37. 401cff: 00
  38.  
  # sin2(double) -- odd polynomial in x, accumulated term by term into %xmm0.
  # In:  %xmm0 = x.   Out: %xmm0 = result.   Scratch: %xmm1-%xmm7.   No calls, no stack use.
  # Notation: Knn = the double read from address 0x4058nn
  #           (.L_2il0floatpacket.440 + offset); the values are not shown in this listing.
  # NOTE(review): presumably sine-series coefficients, going by the function name --
  #               confirm against the data at 0x405858..0x405888.
  # Register roles:
  #   xmm5 = x2 = x*x
  #   xmm6 = pw, a running odd power: x*x2, then multiplied by x2 after each use
  #          (written x^3, x^5, ... x^11 below)
  #   xmm7 = t, a nested chain: (K60*x2 + K58)*x2 + K68
  #   xmm0 = acc, starts as x and receives one term per addsd
  # Value computed:
  #   acc = x + K88*x^3 + K80*x^5 + K78*x^7 + K70*x^9 + t*x^11   (added in that order)
  40. 401d00: 0f 28 e8 movaps %xmm0,%xmm5  # xmm5 = x
  41. 401d03: f2 0f 59 e8 mulsd %xmm0,%xmm5  # x2 = x*x
  42. 401d07: 0f 28 f0 movaps %xmm0,%xmm6  # xmm6 = x
  43. 401d0a: f2 0f 59 f5 mulsd %xmm5,%xmm6  # pw = x * x2            (x^3)
  44. 401d0e: f2 0f 10 0d 72 3b 00 movsd 0x3b72(%rip),%xmm1 # 405888 <.L_2il0floatpacket.440+0x78>  -- xmm1 = K88
  45. 401d15: 00
  46. 401d16: f2 0f 10 3d 42 3b 00 movsd 0x3b42(%rip),%xmm7 # 405860 <.L_2il0floatpacket.440+0x50>  -- t = K60
  47. 401d1d: 00
  48. 401d1e: f2 0f 59 ce mulsd %xmm6,%xmm1  # xmm1 = K88 * x^3
  49. 401d22: f2 0f 59 f5 mulsd %xmm5,%xmm6  # pw *= x2              (x^5)
  50. 401d26: f2 0f 59 fd mulsd %xmm5,%xmm7  # t = K60 * x2
  51. 401d2a: f2 0f 58 c1 addsd %xmm1,%xmm0  # acc = x + K88*x^3
  52. 401d2e: f2 0f 58 3d 22 3b 00 addsd 0x3b22(%rip),%xmm7 # 405858 <.L_2il0floatpacket.440+0x48>  -- t += K58
  53. 401d35: 00
  54. 401d36: f2 0f 10 15 42 3b 00 movsd 0x3b42(%rip),%xmm2 # 405880 <.L_2il0floatpacket.440+0x70>  -- xmm2 = K80
  55. 401d3d: 00
  56. 401d3e: f2 0f 59 d6 mulsd %xmm6,%xmm2  # xmm2 = K80 * x^5
  57. 401d42: f2 0f 59 f5 mulsd %xmm5,%xmm6  # pw *= x2              (x^7)
  58. 401d46: f2 0f 59 fd mulsd %xmm5,%xmm7  # t *= x2
  59. 401d4a: f2 0f 58 c2 addsd %xmm2,%xmm0  # acc += K80*x^5
  60. 401d4e: f2 0f 58 3d 12 3b 00 addsd 0x3b12(%rip),%xmm7 # 405868 <.L_2il0floatpacket.440+0x58>  -- t += K68
  61. 401d55: 00
  62. 401d56: f2 0f 10 1d 1a 3b 00 movsd 0x3b1a(%rip),%xmm3 # 405878 <.L_2il0floatpacket.440+0x68>  -- xmm3 = K78
  63. 401d5d: 00
  64. 401d5e: f2 0f 59 de mulsd %xmm6,%xmm3  # xmm3 = K78 * x^7
  65. 401d62: f2 0f 59 f5 mulsd %xmm5,%xmm6  # pw *= x2              (x^9)
  66. 401d66: f2 0f 58 c3 addsd %xmm3,%xmm0  # acc += K78*x^7
  67. 401d6a: f2 0f 10 25 fe 3a 00 movsd 0x3afe(%rip),%xmm4 # 405870 <.L_2il0floatpacket.440+0x60>  -- xmm4 = K70
  68. 401d71: 00
  69. 401d72: f2 0f 59 e6 mulsd %xmm6,%xmm4  # xmm4 = K70 * x^9
  70. 401d76: f2 0f 59 f5 mulsd %xmm5,%xmm6  # pw *= x2              (x^11)
  71. 401d7a: f2 0f 58 c4 addsd %xmm4,%xmm0  # acc += K70*x^9
  72. 401d7e: f2 0f 59 fe mulsd %xmm6,%xmm7  # t *= x^11
  73. 401d82: f2 0f 58 c7 addsd %xmm7,%xmm0  # acc += t   -> result
  74. 401d86: c3 retq
  75. 401d87: 66 0f 1f 84 00 00 00 nopw 0x0(%rax,%rax,1)  # filler after retq, up to the next function at 401d90
  76. 401d8e: 00 00
  77.  
  # sin3(double) -- polynomial in x2 = x*x evaluated as one nested chain, then scaled by x.
  # In:  %xmm0 = x.   Out: %xmm0 = result.   Scratch: %xmm1, %xmm2.   No calls, no stack use.
  # Notation: Knn = the double read from address 0x4058nn
  #           (.L_2il0floatpacket.440 + offset); the values are not shown in this listing.
  # NOTE(review): presumably sine-series coefficients, going by the function name --
  #               confirm against the data at 0x405858..0x405890.
  # Value computed, in evaluation order:
  #   p = K60
  #   p = p*x2 + Kc         for Kc = K58, K68, K70, K78, K80, K88 in turn
  #   result = x * (x2*p + K90)
  # One multiply per x2 step; each instruction depends on the previous one through %xmm1.
  78. 0000000000401d90 <sin3(double)>:
  79. 401d90: 0f 28 d0 movaps %xmm0,%xmm2  # xmm2 = x
  80. 401d93: f2 0f 59 d0 mulsd %xmm0,%xmm2  # x2 = x*x
  81. 401d97: f2 0f 10 0d c1 3a 00 movsd 0x3ac1(%rip),%xmm1 # 405860 <.L_2il0floatpacket.440+0x50>  -- p = K60
  82. 401d9e: 00
  83. 401d9f: f2 0f 59 ca mulsd %xmm2,%xmm1  # p *= x2
  84. 401da3: f2 0f 58 0d ad 3a 00 addsd 0x3aad(%rip),%xmm1 # 405858 <.L_2il0floatpacket.440+0x48>  -- p += K58
  85. 401daa: 00
  86. 401dab: f2 0f 59 ca mulsd %xmm2,%xmm1  # p *= x2
  87. 401daf: f2 0f 58 0d b1 3a 00 addsd 0x3ab1(%rip),%xmm1 # 405868 <.L_2il0floatpacket.440+0x58>  -- p += K68
  88. 401db6: 00
  89. 401db7: f2 0f 59 ca mulsd %xmm2,%xmm1  # p *= x2
  90. 401dbb: f2 0f 58 0d ad 3a 00 addsd 0x3aad(%rip),%xmm1 # 405870 <.L_2il0floatpacket.440+0x60>  -- p += K70
  91. 401dc2: 00
  92. 401dc3: f2 0f 59 ca mulsd %xmm2,%xmm1  # p *= x2
  93. 401dc7: f2 0f 58 0d a9 3a 00 addsd 0x3aa9(%rip),%xmm1 # 405878 <.L_2il0floatpacket.440+0x68>  -- p += K78
  94. 401dce: 00
  95. 401dcf: f2 0f 59 ca mulsd %xmm2,%xmm1  # p *= x2
  96. 401dd3: f2 0f 58 0d a5 3a 00 addsd 0x3aa5(%rip),%xmm1 # 405880 <.L_2il0floatpacket.440+0x70>  -- p += K80
  97. 401dda: 00
  98. 401ddb: f2 0f 59 ca mulsd %xmm2,%xmm1  # p *= x2
  99. 401ddf: f2 0f 58 0d a1 3a 00 addsd 0x3aa1(%rip),%xmm1 # 405888 <.L_2il0floatpacket.440+0x78>  -- p += K88
  100. 401de6: 00
  101. 401de7: f2 0f 59 d1 mulsd %xmm1,%xmm2  # xmm2 = x2 * p   (x2 is overwritten here)
  102. 401deb: f2 0f 58 15 9d 3a 00 addsd 0x3a9d(%rip),%xmm2 # 405890 <.L_2il0floatpacket.440+0x80>  -- xmm2 += K90
  103. 401df2: 00
  104. 401df3: f2 0f 59 c2 mulsd %xmm2,%xmm0  # xmm0 = x * xmm2   -> result
  105. 401df7: c3 retq
  106. 401df8: 0f 1f 84 00 00 00 00 nopl 0x0(%rax,%rax,1)  # filler after retq, up to the next function at 401e00
  107. 401dff: 00
  108.  
  # sin4(double) -- polynomial in x2 = x*x split into two chains in x4 = x2*x2,
  #                 with the instructions of the two chains interleaved.
  # In:  %xmm0 = x.   Out: %xmm0 = result.   Scratch: %xmm1-%xmm4.   No calls, no stack use.
  # Notation: Knn = the double read from address 0x4058nn
  #           (.L_2il0floatpacket.440 + offset); the values are not shown in this listing.
  # NOTE(review): presumably sine-series coefficients, going by the function name --
  #               confirm against the data at 0x405858..0x405890.
  # Register roles:
  #   xmm3 = x2, xmm2 = x4
  #   xmm4 = E = ((K58*x4 + K70)*x4 + K80)*x4 + K90
  #   xmm1 = O = ((K60*x4 + K68)*x4 + K78)*x4 + K88   (last step lands in xmm2)
  # Value computed:
  #   result = x * (E + x2*O)
  110. 401e00: 0f 28 d8 movaps %xmm0,%xmm3  # xmm3 = x
  111. 401e03: f2 0f 59 d8 mulsd %xmm0,%xmm3  # x2 = x*x
  112. 401e07: 0f 28 d3 movaps %xmm3,%xmm2  # xmm2 = x2
  113. 401e0a: f2 0f 59 d3 mulsd %xmm3,%xmm2  # x4 = x2*x2
  114. 401e0e: f2 0f 10 25 42 3a 00 movsd 0x3a42(%rip),%xmm4 # 405858 <.L_2il0floatpacket.440+0x48>  -- E = K58
  115. 401e15: 00
  116. 401e16: f2 0f 10 0d 42 3a 00 movsd 0x3a42(%rip),%xmm1 # 405860 <.L_2il0floatpacket.440+0x50>  -- O = K60
  117. 401e1d: 00
  118. 401e1e: f2 0f 59 e2 mulsd %xmm2,%xmm4  # E *= x4
  119. 401e22: f2 0f 59 ca mulsd %xmm2,%xmm1  # O *= x4
  120. 401e26: f2 0f 58 25 42 3a 00 addsd 0x3a42(%rip),%xmm4 # 405870 <.L_2il0floatpacket.440+0x60>  -- E += K70
  121. 401e2d: 00
  122. 401e2e: f2 0f 58 0d 32 3a 00 addsd 0x3a32(%rip),%xmm1 # 405868 <.L_2il0floatpacket.440+0x58>  -- O += K68
  123. 401e35: 00
  124. 401e36: f2 0f 59 e2 mulsd %xmm2,%xmm4  # E *= x4
  125. 401e3a: f2 0f 59 ca mulsd %xmm2,%xmm1  # O *= x4
  126. 401e3e: f2 0f 58 25 3a 3a 00 addsd 0x3a3a(%rip),%xmm4 # 405880 <.L_2il0floatpacket.440+0x70>  -- E += K80
  127. 401e45: 00
  128. 401e46: f2 0f 58 0d 2a 3a 00 addsd 0x3a2a(%rip),%xmm1 # 405878 <.L_2il0floatpacket.440+0x68>  -- O += K78
  129. 401e4d: 00
  130. 401e4e: f2 0f 59 e2 mulsd %xmm2,%xmm4  # E *= x4
  131. 401e52: f2 0f 59 d1 mulsd %xmm1,%xmm2  # xmm2 = x4 * O   (x4 is overwritten; O continues in xmm2)
  132. 401e56: f2 0f 58 25 32 3a 00 addsd 0x3a32(%rip),%xmm4 # 405890 <.L_2il0floatpacket.440+0x80>  -- E += K90
  133. 401e5d: 00
  134. 401e5e: f2 0f 58 15 22 3a 00 addsd 0x3a22(%rip),%xmm2 # 405888 <.L_2il0floatpacket.440+0x78>  -- O += K88
  135. 401e65: 00
  136. 401e66: f2 0f 59 da mulsd %xmm2,%xmm3  # xmm3 = x2 * O
  137. 401e6a: f2 0f 58 e3 addsd %xmm3,%xmm4  # xmm4 = E + x2*O
  138. 401e6e: f2 0f 59 c4 mulsd %xmm4,%xmm0  # xmm0 = x * xmm4   -> result
  139. 401e72: c3 retq
  140. 401e73: 0f 1f 44 00 00 nopl 0x0(%rax,%rax,1)  # filler after retq (5 bytes) ...
  141. 401e78: 0f 1f 84 00 00 00 00 nopl 0x0(%rax,%rax,1)  # ... and 8 more, up to the next function at 401e80
  142. 401e7f: 00
  143.  
  # sin5(double) -- polynomial in x2 = x*x split into three chains in x6 = x2*x4.
  # In:  %xmm0 = x.   Out: %xmm0 = result.   Scratch: %xmm1-%xmm6.   No calls, no stack use.
  # Notation: Knn = the double read from address 0x4058nn
  #           (.L_2il0floatpacket.440 + offset); the values are not shown in this listing.
  # NOTE(review): presumably sine-series coefficients, going by the function name --
  #               confirm against the data at 0x405858..0x405890.
  # Register roles:
  #   xmm2 = x2, xmm5 = x4 = x2*x2, xmm4 = x6 = x2*x4
  #   xmm6 = A = (K58*x6 + K78)*x6 + K90
  #   xmm1 = B = (K60*x6 + K70)*x6 + K88
  #   xmm4 = C =  K68*x6 + K80            (reuses the x6 register once x6 is no longer needed)
  # Value computed:
  #   result = x * ((A + x2*B) + x4*C)
  144. 0000000000401e80 <sin5(double)>:
  145. 401e80: 0f 28 d0 movaps %xmm0,%xmm2  # xmm2 = x
  146. 401e83: f2 0f 59 d0 mulsd %xmm0,%xmm2  # x2 = x*x
  147. 401e87: 0f 28 ea movaps %xmm2,%xmm5  # xmm5 = x2
  148. 401e8a: 0f 28 e2 movaps %xmm2,%xmm4  # xmm4 = x2
  149. 401e8d: f2 0f 59 ea mulsd %xmm2,%xmm5  # x4 = x2*x2
  150. 401e91: f2 0f 59 e5 mulsd %xmm5,%xmm4  # x6 = x2*x4
  151. 401e95: f2 0f 10 0d c3 39 00 movsd 0x39c3(%rip),%xmm1 # 405860 <.L_2il0floatpacket.440+0x50>  -- B = K60
  152. 401e9c: 00
  153. 401e9d: f2 0f 59 cc mulsd %xmm4,%xmm1  # B *= x6
  154. 401ea1: f2 0f 10 35 af 39 00 movsd 0x39af(%rip),%xmm6 # 405858 <.L_2il0floatpacket.440+0x48>  -- A = K58
  155. 401ea8: 00
  156. 401ea9: f2 0f 59 f4 mulsd %xmm4,%xmm6  # A *= x6
  157. 401ead: f2 0f 58 0d bb 39 00 addsd 0x39bb(%rip),%xmm1 # 405870 <.L_2il0floatpacket.440+0x60>  -- B += K70
  158. 401eb4: 00
  159. 401eb5: f2 0f 59 cc mulsd %xmm4,%xmm1  # B *= x6
  160. 401eb9: f2 0f 58 35 b7 39 00 addsd 0x39b7(%rip),%xmm6 # 405878 <.L_2il0floatpacket.440+0x68>  -- A += K78
  161. 401ec0: 00
  162. 401ec1: f2 0f 10 1d 9f 39 00 movsd 0x399f(%rip),%xmm3 # 405868 <.L_2il0floatpacket.440+0x58>  -- xmm3 = K68
  163. 401ec8: 00
  164. 401ec9: f2 0f 59 f4 mulsd %xmm4,%xmm6  # A *= x6
  165. 401ecd: f2 0f 58 0d b3 39 00 addsd 0x39b3(%rip),%xmm1 # 405888 <.L_2il0floatpacket.440+0x78>  -- B += K88
  166. 401ed4: 00
  167. 401ed5: f2 0f 59 e3 mulsd %xmm3,%xmm4  # C = x6 * K68   (x6 is overwritten; last use was above)
  168. 401ed9: f2 0f 59 d1 mulsd %xmm1,%xmm2  # xmm2 = x2 * B
  169. 401edd: f2 0f 58 35 ab 39 00 addsd 0x39ab(%rip),%xmm6 # 405890 <.L_2il0floatpacket.440+0x80>  -- A += K90
  170. 401ee4: 00
  171. 401ee5: f2 0f 58 25 93 39 00 addsd 0x3993(%rip),%xmm4 # 405880 <.L_2il0floatpacket.440+0x70>  -- C += K80
  172. 401eec: 00
  173. 401eed: f2 0f 58 f2 addsd %xmm2,%xmm6  # xmm6 = A + x2*B
  174. 401ef1: f2 0f 59 ec mulsd %xmm4,%xmm5  # xmm5 = x4 * C
  175. 401ef5: f2 0f 58 f5 addsd %xmm5,%xmm6  # xmm6 += x4*C
  176. 401ef9: f2 0f 59 c6 mulsd %xmm6,%xmm0  # xmm0 = x * xmm6   -> result
  177. 401efd: c3 retq
  178. 401efe: 66 90 xchg %ax,%ax  # bytes 66 90 = two-byte nop; filler after retq, up to the next function at 401f00
  179.  
  # sin6(double) -- polynomial in x2 = x*x split into a low and a high half,
  #                 each a nested chain in x2, joined with x8.
  # In:  %xmm0 = x.   Out: %xmm0 = result.   Scratch: %xmm1-%xmm4.   No calls, no stack use.
  # Notation: Knn = the double read from address 0x4058nn
  #           (.L_2il0floatpacket.440 + offset); the values are not shown in this listing.
  # NOTE(review): presumably sine-series coefficients, going by the function name --
  #               confirm against the data at 0x405858..0x405890.
  # Register roles:
  #   xmm2 = x2
  #   xmm3 = x4 = x2*x2, then x8 = x4*x4
  #   xmm4 = LO = ((K78*x2 + K80)*x2 + K88)*x2 + K90
  #   xmm1 = HI = ((K60*x2 + K58)*x2 + K68)*x2 + K70   (last step lands in xmm2)
  # Value computed:
  #   result = x * (LO + x8*HI)
  180. 0000000000401f00 <sin6(double)>:
  181. 401f00: 0f 28 d0 movaps %xmm0,%xmm2  # xmm2 = x
  182. 401f03: f2 0f 59 d0 mulsd %xmm0,%xmm2  # x2 = x*x
  183. 401f07: f2 0f 10 25 69 39 00 movsd 0x3969(%rip),%xmm4 # 405878 <.L_2il0floatpacket.440+0x68>  -- LO = K78
  184. 401f0e: 00
  185. 401f0f: 0f 28 da movaps %xmm2,%xmm3  # xmm3 = x2
  186. 401f12: f2 0f 10 0d 46 39 00 movsd 0x3946(%rip),%xmm1 # 405860 <.L_2il0floatpacket.440+0x50>  -- HI = K60
  187. 401f19: 00
  188. 401f1a: f2 0f 59 e2 mulsd %xmm2,%xmm4  # LO *= x2
  189. 401f1e: f2 0f 59 ca mulsd %xmm2,%xmm1  # HI *= x2
  190. 401f22: f2 0f 59 da mulsd %xmm2,%xmm3  # xmm3 = x4 = x2*x2
  191. 401f26: f2 0f 58 25 52 39 00 addsd 0x3952(%rip),%xmm4 # 405880 <.L_2il0floatpacket.440+0x70>  -- LO += K80
  192. 401f2d: 00
  193. 401f2e: f2 0f 58 0d 22 39 00 addsd 0x3922(%rip),%xmm1 # 405858 <.L_2il0floatpacket.440+0x48>  -- HI += K58
  194. 401f35: 00
  195. 401f36: f2 0f 59 db mulsd %xmm3,%xmm3  # xmm3 = x8 = x4*x4
  196. 401f3a: f2 0f 59 e2 mulsd %xmm2,%xmm4  # LO *= x2
  197. 401f3e: f2 0f 59 ca mulsd %xmm2,%xmm1  # HI *= x2
  198. 401f42: f2 0f 58 25 3e 39 00 addsd 0x393e(%rip),%xmm4 # 405888 <.L_2il0floatpacket.440+0x78>  -- LO += K88
  199. 401f49: 00
  200. 401f4a: f2 0f 58 0d 16 39 00 addsd 0x3916(%rip),%xmm1 # 405868 <.L_2il0floatpacket.440+0x58>  -- HI += K68
  201. 401f51: 00
  202. 401f52: f2 0f 59 e2 mulsd %xmm2,%xmm4  # LO *= x2
  203. 401f56: f2 0f 59 d1 mulsd %xmm1,%xmm2  # xmm2 = x2 * HI   (x2 is overwritten; HI continues in xmm2)
  204. 401f5a: f2 0f 58 25 2e 39 00 addsd 0x392e(%rip),%xmm4 # 405890 <.L_2il0floatpacket.440+0x80>  -- LO += K90
  205. 401f61: 00
  206. 401f62: f2 0f 58 15 06 39 00 addsd 0x3906(%rip),%xmm2 # 405870 <.L_2il0floatpacket.440+0x60>  -- HI += K70
  207. 401f69: 00
  208. 401f6a: f2 0f 59 da mulsd %xmm2,%xmm3  # xmm3 = x8 * HI
  209. 401f6e: f2 0f 58 e3 addsd %xmm3,%xmm4  # xmm4 = LO + x8*HI
  210. 401f72: f2 0f 59 c4 mulsd %xmm4,%xmm0  # xmm0 = x * xmm4   -> result
  211. 401f76: c3 retq
  212. 401f77: 66 0f 1f 84 00 00 00 nopw 0x0(%rax,%rax,1)  # filler after retq, up to the next function at 401f80
  213. 401f7e: 00 00
  214.  
  # sin7(double) -- odd polynomial in x: two nested chains in x2 = x*x, scaled by
  #                 x3 and x9, then added to x.
  # In:  %xmm0 = x.   Out: %xmm0 = result.   Scratch: %xmm1-%xmm7.   No calls, no stack use.
  # Notation: Knn = the double read from address 0x4058nn
  #           (.L_2il0floatpacket.440 + offset); the values are not shown in this listing.
  # NOTE(review): presumably sine-series coefficients, going by the function name --
  #               confirm against the data at 0x405858..0x405888.
  # Register roles:
  #   xmm5 = x2
  #   xmm2 = x4 = x2*x2,  xmm1 = x8 = x4*x4
  #   xmm7 = x3 = x*x2,   xmm6 = x9 = x*x8
  #   xmm3 = LO = (K78*x2 + K80)*x2 + K88
  #   xmm4 = HI = ((K60*x2 + K58)*x2 + K68)*x2 + K70   (last step lands in xmm5)
  # Value computed:
  #   result = x + (x3*LO + x9*HI)
  215. 0000000000401f80 <sin7(double)>:
  216. 401f80: 0f 28 e8 movaps %xmm0,%xmm5  # xmm5 = x
  217. 401f83: f2 0f 59 e8 mulsd %xmm0,%xmm5  # x2 = x*x
  218. 401f87: 0f 28 f8 movaps %xmm0,%xmm7  # xmm7 = x
  219. 401f8a: 0f 28 d5 movaps %xmm5,%xmm2  # xmm2 = x2
  220. 401f8d: 0f 28 f0 movaps %xmm0,%xmm6  # xmm6 = x
  221. 401f90: f2 0f 59 d5 mulsd %xmm5,%xmm2  # x4 = x2*x2
  222. 401f94: f2 0f 59 fd mulsd %xmm5,%xmm7  # x3 = x*x2
  223. 401f98: 0f 28 ca movaps %xmm2,%xmm1  # xmm1 = x4
  224. 401f9b: f2 0f 59 ca mulsd %xmm2,%xmm1  # x8 = x4*x4
  225. 401f9f: f2 0f 59 f1 mulsd %xmm1,%xmm6  # x9 = x*x8
  226. 401fa3: f2 0f 10 25 b5 38 00 movsd 0x38b5(%rip),%xmm4 # 405860 <.L_2il0floatpacket.440+0x50>  -- HI = K60
  227. 401faa: 00
  228. 401fab: f2 0f 59 e5 mulsd %xmm5,%xmm4  # HI *= x2
  229. 401faf: f2 0f 10 1d c1 38 00 movsd 0x38c1(%rip),%xmm3 # 405878 <.L_2il0floatpacket.440+0x68>  -- LO = K78
  230. 401fb6: 00
  231. 401fb7: f2 0f 59 dd mulsd %xmm5,%xmm3  # LO *= x2
  232. 401fbb: f2 0f 58 25 95 38 00 addsd 0x3895(%rip),%xmm4 # 405858 <.L_2il0floatpacket.440+0x48>  -- HI += K58
  233. 401fc2: 00
  234. 401fc3: f2 0f 59 e5 mulsd %xmm5,%xmm4  # HI *= x2
  235. 401fc7: f2 0f 58 1d b1 38 00 addsd 0x38b1(%rip),%xmm3 # 405880 <.L_2il0floatpacket.440+0x70>  -- LO += K80
  236. 401fce: 00
  237. 401fcf: f2 0f 59 dd mulsd %xmm5,%xmm3  # LO *= x2
  238. 401fd3: f2 0f 58 25 8d 38 00 addsd 0x388d(%rip),%xmm4 # 405868 <.L_2il0floatpacket.440+0x58>  -- HI += K68
  239. 401fda: 00
  240. 401fdb: f2 0f 59 ec mulsd %xmm4,%xmm5  # xmm5 = x2 * HI   (x2 is overwritten; HI continues in xmm5)
  241. 401fdf: f2 0f 58 1d a1 38 00 addsd 0x38a1(%rip),%xmm3 # 405888 <.L_2il0floatpacket.440+0x78>  -- LO += K88
  242. 401fe6: 00
  243. 401fe7: f2 0f 59 fb mulsd %xmm3,%xmm7  # xmm7 = x3 * LO
  244. 401feb: f2 0f 58 2d 7d 38 00 addsd 0x387d(%rip),%xmm5 # 405870 <.L_2il0floatpacket.440+0x60>  -- HI += K70
  245. 401ff2: 00
  246. 401ff3: f2 0f 59 f5 mulsd %xmm5,%xmm6  # xmm6 = x9 * HI
  247. 401ff7: f2 0f 58 fe addsd %xmm6,%xmm7  # xmm7 = x3*LO + x9*HI
  248. 401ffb: f2 0f 58 c7 addsd %xmm7,%xmm0  # xmm0 = x + xmm7   -> result
  249. 401fff: c3 retq
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement