asm.h 6.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154
  1. /*
  2. * copyright (c) 2006 Michael Niedermayer <michaelni@gmx.at>
  3. *
  4. * This file is part of FFmpeg.
  5. *
  6. * FFmpeg is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU Lesser General Public
  8. * License as published by the Free Software Foundation; either
  9. * version 2.1 of the License, or (at your option) any later version.
  10. *
  11. * FFmpeg is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  14. * Lesser General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU Lesser General Public
  17. * License along with FFmpeg; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19. */
  20. #ifndef AVUTIL_X86_ASM_H
  21. #define AVUTIL_X86_ASM_H
  22. #include <stdint.h>
  23. #include "config.h"
  24. typedef struct xmm_reg { uint64_t a, b; } xmm_reg;
  25. typedef struct ymm_reg { uint64_t a, b, c, d; } ymm_reg;
  26. #if ARCH_X86_64
  27. # define FF_OPSIZE "q"
  28. # define FF_REG_a "rax"
  29. # define FF_REG_b "rbx"
  30. # define FF_REG_c "rcx"
  31. # define FF_REG_d "rdx"
  32. # define FF_REG_D "rdi"
  33. # define FF_REG_S "rsi"
  34. # define FF_PTR_SIZE "8"
  35. typedef int64_t x86_reg;
  36. /* FF_REG_SP is defined in Solaris sys headers, so use FF_REG_sp */
  37. # define FF_REG_sp "rsp"
  38. # define FF_REG_BP "rbp"
  39. # define FF_REGBP rbp
  40. # define FF_REGa rax
  41. # define FF_REGb rbx
  42. # define FF_REGc rcx
  43. # define FF_REGd rdx
  44. # define FF_REGSP rsp
  45. #elif ARCH_X86_32
  46. # define FF_OPSIZE "l"
  47. # define FF_REG_a "eax"
  48. # define FF_REG_b "ebx"
  49. # define FF_REG_c "ecx"
  50. # define FF_REG_d "edx"
  51. # define FF_REG_D "edi"
  52. # define FF_REG_S "esi"
  53. # define FF_PTR_SIZE "4"
  54. typedef int32_t x86_reg;
  55. # define FF_REG_sp "esp"
  56. # define FF_REG_BP "ebp"
  57. # define FF_REGBP ebp
  58. # define FF_REGa eax
  59. # define FF_REGb ebx
  60. # define FF_REGc ecx
  61. # define FF_REGd edx
  62. # define FF_REGSP esp
  63. #else
  64. typedef int x86_reg;
  65. #endif
  66. #define HAVE_7REGS (ARCH_X86_64 || (HAVE_EBX_AVAILABLE && HAVE_EBP_AVAILABLE))
  67. #define HAVE_6REGS (ARCH_X86_64 || (HAVE_EBX_AVAILABLE || HAVE_EBP_AVAILABLE))
  68. #if ARCH_X86_64 && defined(PIC)
  69. # define BROKEN_RELOCATIONS 1
  70. #endif
  71. /*
  72. * If gcc is not set to support sse (-msse) it will not accept xmm registers
  73. * in the clobber list for inline asm. XMM_CLOBBERS takes a list of xmm
  74. * registers to be marked as clobbered and evaluates to nothing if they are
  75. * not supported, or to the list itself if they are supported. Since a clobber
  76. * list may not be empty, XMM_CLOBBERS_ONLY should be used if the xmm
  77. * registers are the only in the clobber list.
  78. * For example a list with "eax" and "xmm0" as clobbers should become:
  79. * : XMM_CLOBBERS("xmm0",) "eax"
  80. * and a list with only "xmm0" should become:
  81. * XMM_CLOBBERS_ONLY("xmm0")
  82. */
  83. #if HAVE_XMM_CLOBBERS
  84. # define XMM_CLOBBERS(...) __VA_ARGS__
  85. # define XMM_CLOBBERS_ONLY(...) : __VA_ARGS__
  86. #else
  87. # define XMM_CLOBBERS(...)
  88. # define XMM_CLOBBERS_ONLY(...)
  89. #endif
  90. /* Use to export labels from asm. */
  91. #define LABEL_MANGLE(a) EXTERN_PREFIX #a
  92. // Use rip-relative addressing if compiling PIC code on x86-64.
  93. #if ARCH_X86_64 && defined(PIC)
  94. # define LOCAL_MANGLE(a) #a "(%%rip)"
  95. #else
  96. # define LOCAL_MANGLE(a) #a
  97. #endif
  98. #if HAVE_INLINE_ASM_DIRECT_SYMBOL_REFS
  99. # define MANGLE(a) EXTERN_PREFIX LOCAL_MANGLE(a)
  100. # define NAMED_CONSTRAINTS_ADD(...)
  101. # define NAMED_CONSTRAINTS(...)
  102. # define NAMED_CONSTRAINTS_ARRAY_ADD(...)
  103. # define NAMED_CONSTRAINTS_ARRAY(...)
  104. #else
  105. /* When direct symbol references are used in code passed to a compiler that does not support them
  106. * then these references need to be converted to named asm constraints instead.
  107. * Instead of returning a direct symbol MANGLE now returns a named constraint for that specific symbol.
  108. * In order for this to work there must also be a corresponding entry in the asm-interface. To add this
  109. * entry use the macro NAMED_CONSTRAINTS() and pass in a list of each symbol reference used in the
  110. * corresponding block of code. (e.g. NAMED_CONSTRAINTS(var1,var2,var3) where var1 is the first symbol etc. ).
  111. * If there are already existing constraints then use NAMED_CONSTRAINTS_ADD to add to the existing constraint list.
  112. */
  113. # define MANGLE(a) "%["#a"]"
  114. // Intel/MSVC does not correctly expand va-args so we need a rather ugly hack in order to get it to work
  115. # define FE_0(P,X) P(X)
  116. # define FE_1(P,X,X1) P(X), FE_0(P,X1)
  117. # define FE_2(P,X,X1,X2) P(X), FE_1(P,X1,X2)
  118. # define FE_3(P,X,X1,X2,X3) P(X), FE_2(P,X1,X2,X3)
  119. # define FE_4(P,X,X1,X2,X3,X4) P(X), FE_3(P,X1,X2,X3,X4)
  120. # define FE_5(P,X,X1,X2,X3,X4,X5) P(X), FE_4(P,X1,X2,X3,X4,X5)
  121. # define FE_6(P,X,X1,X2,X3,X4,X5,X6) P(X), FE_5(P,X1,X2,X3,X4,X5,X6)
  122. # define FE_7(P,X,X1,X2,X3,X4,X5,X6,X7) P(X), FE_6(P,X1,X2,X3,X4,X5,X6,X7)
  123. # define FE_8(P,X,X1,X2,X3,X4,X5,X6,X7,X8) P(X), FE_7(P,X1,X2,X3,X4,X5,X6,X7,X8)
  124. # define FE_9(P,X,X1,X2,X3,X4,X5,X6,X7,X8,X9) P(X), FE_8(P,X1,X2,X3,X4,X5,X6,X7,X8,X9)
  125. # define GET_FE_IMPL(_0,_1,_2,_3,_4,_5,_6,_7,_8,_9,NAME,...) NAME
  126. # define GET_FE(A) GET_FE_IMPL A
  127. # define GET_FE_GLUE(x, y) x y
  128. # define FOR_EACH_VA(P,...) GET_FE_GLUE(GET_FE((__VA_ARGS__,FE_9,FE_8,FE_7,FE_6,FE_5,FE_4,FE_3,FE_2,FE_1,FE_0)), (P,__VA_ARGS__))
  129. # define NAME_CONSTRAINT(x) [x] "m"(x)
  130. // Parameters are a list of each symbol reference required
  131. # define NAMED_CONSTRAINTS_ADD(...) , FOR_EACH_VA(NAME_CONSTRAINT,__VA_ARGS__)
  132. // Same but without comma for when there are no previously defined constraints
  133. # define NAMED_CONSTRAINTS(...) FOR_EACH_VA(NAME_CONSTRAINT,__VA_ARGS__)
  134. // Same as above NAMED_CONSTRAINTS except used for passing arrays/pointers instead of normal variables
  135. # define NAME_CONSTRAINT_ARRAY(x) [x] "m"(*x)
  136. # define NAMED_CONSTRAINTS_ARRAY_ADD(...) , FOR_EACH_VA(NAME_CONSTRAINT_ARRAY,__VA_ARGS__)
  137. # define NAMED_CONSTRAINTS_ARRAY(...) FOR_EACH_VA(NAME_CONSTRAINT_ARRAY,__VA_ARGS__)
  138. #endif
  139. #endif /* AVUTIL_X86_ASM_H */