1 files changed, 504 insertions, 0 deletions
diff --git a/src/llvm/atomic/atomic-x86.c b/src/llvm/atomic/atomic-x86.c
new file mode 100644
index 0000000..dc0baf0
--- /dev/null
+++ b/src/llvm/atomic/atomic-x86.c
@@ -0,0 +1,504 @@
+/*
+ * Copyright (C) 2010 Parallel Processing Institute (PPI), Fudan Univ.
+ *  <http://ppi.fudan.edu.cn/system_research_group>
+ *
+ * Authors:
+ *  Zhaoguo Wang    <zgwang@fudan.edu.cn>
+ *  Yufei Chen      <chenyufei@fudan.edu.cn>
+ *  Ran Liu         <naruilone@gmail.com>
+ *  Xi Wu           <wuxi@fudan.edu.cn>
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2 of the License, or (at your option) any later version.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with this library; if not, see <http://www.gnu.org/licenses/>.
+ */
+
+/* We include this file in op_helper.c */
+
+#include <stdlib.h>
+#include <pthread.h>
+#include <assert.h>
+#include "coremu-atomic.h"
+
+#define EAX (env->regs[R_EAX])  /* register shorthands; require `env` in scope */
+#define ECX (env->regs[R_ECX])
+#define EDX (env->regs[R_EDX])
+#define EBX (env->regs[R_EBX])
+/* Byte offsets of the sub-register views inside one target_ulong register
+ * slot, selected by WORDS_BIGENDIAN.  Copied from translate.c. */
+#if defined(WORDS_BIGENDIAN)
+#define REG_B_OFFSET (sizeof(target_ulong) - 1)
+#define REG_H_OFFSET (sizeof(target_ulong) - 2)
+#define REG_W_OFFSET (sizeof(target_ulong) - 2)
+#define REG_L_OFFSET (sizeof(target_ulong) - 4)
+#define REG_LH_OFFSET (sizeof(target_ulong) - 8)
+#else
+#define REG_B_OFFSET 0
+#define REG_H_OFFSET 1
+#define REG_W_OFFSET 0
+#define REG_L_OFFSET 0
+#define REG_LH_OFFSET 4
+#endif
+/* X86_64_DEF(x) expands to x when TARGET_X86_64 is defined, else to nothing. */
+#ifdef TARGET_X86_64
+#define X86_64_DEF(...)  __VA_ARGS__
+#else
+#define X86_64_DEF(...)
+#endif
+/* All-ones 64-bit value shifted right by 32: keeps the low 32 bits when ANDed. */
+#define REG_LOW_MASK (~(uint64_t)0x0>>32)
+
+/* i386 arith/logic operation selectors.  The `op` argument of the
+ * helper_atomic_op{b,w,l,q} helpers in this file is matched against these. */
+enum {
+    OP_ADDL,
+    OP_ORL,
+    OP_ADCL,
+    OP_SBBL,
+    OP_ANDL,
+    OP_SUBL,
+    OP_XORL,
+    OP_CMPL,    /* helper_atomic_op aborts when asked for this one */
+};
+
+/* Fetch guest general-purpose register `reg` as seen by an operand of size
+ * class `ot`.  A byte operand (ot == 0) naming register 4..7 without the
+ * x86-64 exceptions reads one byte of register reg - 4; every other case
+ * yields the full, untruncated register, so callers narrow it themselves. */
+static target_ulong cm_get_reg_val(CPUX86State *env, int ot, int hregs, int reg)
+{
+    const uint8_t *state = (const uint8_t *)env;
+    target_ulong high_off;
+
+    /* Anything but a byte access always uses the whole register. */
+    if (ot != 0 /* OT_BYTE */) {
+        return env->regs[reg];
+    }
+
+    /* Low-byte encodings (and, on x86-64, regs >= 8 or `hregs` set). */
+    if (reg < 4 X86_64_DEF( || reg >= 8 || hregs)) {
+        return env->regs[reg];
+    }
+
+    /* High-byte encoding: byte at REG_H_OFFSET inside register reg - 4. */
+    high_off = offsetof(CPUX86State, regs[reg - 4]) + REG_H_OFFSET;
+    return state[high_off];
+}
+
+/* Store `val` into guest register `reg` using the width selected by `ot`:
+ * 0 writes one byte (low byte, or one byte of reg - 4 for the legacy
+ * encodings 4..7), 1 writes 16 bits, 2 writes the value masked to 32 bits
+ * into the whole register, anything else writes the whole register. */
+static void cm_set_reg_val(CPUX86State *env, int ot, int hregs, int reg, target_ulong val)
+{
+    uint8_t *state = (uint8_t *)env;
+    target_ulong off;
+
+    if (ot == 0) {                  /* OT_BYTE */
+        if (reg < 4 X86_64_DEF (|| reg >= 8 || hregs)) {
+            off = offsetof(CPUX86State, regs[reg]) + REG_B_OFFSET;
+        } else {
+            off = offsetof(CPUX86State, regs[reg - 4]) + REG_H_OFFSET;
+        }
+        state[off] = (uint8_t)val;
+        return;
+    }
+    if (ot == 1) {                  /* OT_WORD: other bytes are untouched */
+        off = offsetof(CPUX86State, regs[reg]) + REG_W_OFFSET;
+        *((uint16_t *)(state + off)) = (uint16_t)val;
+        return;
+    }
+    if (ot == 2) {                  /* OT_LONG: bits above 31 are cleared */
+        env->regs[reg] = REG_LOW_MASK & val;
+        return;
+    }
+    env->regs[reg] = val;           /* OT_QUAD and any other value */
+}
+
+#define LD_b ldub_p
+#define LD_w lduw_p
+#define LD_l ldl_p
+#define LD_q ldq_p
+/* Lightweight transactional memory: load, run `command` on `value`, and retry
+ * until the compare-exchange returns the value that was first loaded. */
+#define TX(vaddr, type, value, command) \
+    unsigned long __q_addr;                                   \
+    DATA_##type __oldv;                                       \
+    DATA_##type value;                                        \
+    /* The locals above stay visible to code following TX(). */ \
+    CM_GET_QEMU_ADDR(env, __q_addr, vaddr); /* TODO confirm: guest->host */ \
+    do {                                                      \
+        __oldv = value = LD_##type((DATA_##type *)__q_addr);  \
+        {command;};                                           \
+        mb();                                                 \
+    } while (__oldv != (atomic_compare_exchange##type(        \
+                    (DATA_##type *)__q_addr, __oldv, value)))
+
+/* Atomically emulate a locked INC (c > 0) or DEC (otherwise) on the operand at
+ * guest address a0, using the compare-and-swap retry loop of TX(). */
+#define GEN_ATOMIC_INC(type, TYPE) \
+void helper_atomic_inc##type(CPUX86State *env, target_ulong a0, int c) \
+{                                                                      \
+    int eflags_c, eflags;                                              \
+    int cc_op;                                                         \
+                                                                       \
+    /* carry flag left by the previous instruction, reused via CC_SRC */ \
+    eflags_c = helper_cc_compute_c(CC_DST, CC_SRC, CC_SRC2, CC_OP);    \
+                                                                       \
+    TX(a0, type, value, {                                              \
+        if (c > 0) {                                                   \
+            value++;                                                   \
+            cc_op = CC_OP_INC##TYPE;                                   \
+        } else {                                                       \
+            value--;                                                   \
+            cc_op = CC_OP_DEC##TYPE;                                   \
+        }                                                              \
+    });                                                                \
+    /* Committed: `value` now holds the result that was stored. */     \
+    CC_SRC = eflags_c;                                                 \
+    CC_DST = value;                                                    \
+    /* Evaluate the flags for cc_op and keep them in CC_SRC. */        \
+    eflags = helper_cc_compute_all(CC_DST, CC_SRC, CC_SRC2, cc_op);    \
+    CC_SRC = eflags;                                                   \
+}                                                                      \
+
+GEN_ATOMIC_INC(b, B);
+GEN_ATOMIC_INC(w, W);
+GEN_ATOMIC_INC(l, L);
+#ifdef TARGET_X86_64
+GEN_ATOMIC_INC(q, Q);
+#endif
+
+#define OT_b 0  /* operand-size codes passed as `ot`, keyed by type suffix */
+#define OT_w 1
+#define OT_l 2
+#define OT_q 3
+/* XCHG: atomically swap guest register `reg` with the operand at guest address a0. */
+#define GEN_ATOMIC_XCHG(type) \
+void helper_xchg##type(CPUX86State *env, target_ulong a0, int reg, \
+                int hreg)                                          \
+{                                                                  \
+    DATA_##type val, out;                                          \
+    unsigned long q_addr;                                          \
+    /* `val` is the register content narrowed to the operand size. */ \
+    CM_GET_QEMU_ADDR(env, q_addr, a0);                             \
+    val = (DATA_##type)cm_get_reg_val(env, OT_##type, hreg, reg);  \
+    out = atomic_exchange##type((DATA_##type *)q_addr, val);       \
+    mb();                                                          \
+    /* `out` (presumably the previous memory content) goes to the register. */ \
+    cm_set_reg_val(env, OT_##type, hreg, reg, out);                \
+}
+
+GEN_ATOMIC_XCHG(b);
+GEN_ATOMIC_XCHG(w);
+GEN_ATOMIC_XCHG(l);
+#ifdef TARGET_X86_64
+GEN_ATOMIC_XCHG(q);
+#endif
+
+#define GEN_ATOMIC_OP(type, TYPE) \
+void helper_atomic_op##type(CPUX86State *env, target_ulong a0,      \
+                target_ulong t1, int op)                            \
+{                                                                   \
+    DATA_##type operand;                                            \
+    int eflags_c, eflags;                                           \
+    int cc_op;                                                      \
+    /* Locked ALU op `op` on the operand at a0 with source t1. */   \
+    /* carry flag of the previous instruction, used by ADC/SBB */   \
+    eflags_c = helper_cc_compute_c(CC_DST, CC_SRC, CC_SRC2, CC_OP); \
+    operand = (DATA_##type)t1;                                      \
+                                                                    \
+    TX(a0, type, value, {                                           \
+        switch(op) {                                                \
+        case OP_ADCL:                                               \
+            value += operand + eflags_c;                            \
+            cc_op = CC_OP_ADD##TYPE + (eflags_c << 2); /* TODO confirm: ADC op == ADD op + 4 */ \
+            CC_SRC = operand;                                       \
+            break;                                                  \
+        case OP_SBBL:                                               \
+            value = value - operand - eflags_c;                     \
+            cc_op = CC_OP_SUB##TYPE + (eflags_c << 2); /* TODO confirm: SBB op == SUB op + 4 */ \
+            CC_SRC = operand;                                       \
+            break;                                                  \
+        case OP_ADDL:                                               \
+            value += operand;                                       \
+            cc_op = CC_OP_ADD##TYPE;                                \
+            CC_SRC = operand;                                       \
+            break;                                                  \
+        case OP_SUBL:                                               \
+            value -= operand;                                       \
+            cc_op = CC_OP_SUB##TYPE;                                \
+            CC_SRC = operand;                                       \
+            break;                                                  \
+        default: /* unlisted op values behave as AND */             \
+        case OP_ANDL:                                               \
+            value &= operand;                                       \
+            cc_op = CC_OP_LOGIC##TYPE;                              \
+            break;                                                  \
+        case OP_ORL:                                                \
+            value |= operand;                                       \
+            cc_op = CC_OP_LOGIC##TYPE;                              \
+            break;                                                  \
+        case OP_XORL:                                               \
+            value ^= operand;                                       \
+            cc_op = CC_OP_LOGIC##TYPE;                              \
+            break;                                                  \
+        case OP_CMPL:                                               \
+            abort(); /* CMP is not served by this helper */         \
+            break;                                                  \
+        }                                                           \
+    });                                                             \
+    CC_DST = value;                                                 \
+    /* successful transaction, compute the eflags */                \
+    eflags = helper_cc_compute_all(CC_DST, CC_SRC, CC_SRC2, cc_op); \
+    CC_SRC = eflags;                                                \
+}
+
+GEN_ATOMIC_OP(b, B);
+GEN_ATOMIC_OP(w, W);
+GEN_ATOMIC_OP(l, L);
+#ifdef TARGET_X86_64
+GEN_ATOMIC_OP(q, Q);
+#endif
+
+/* XADD: atomically add guest register `reg` to the operand at a0; the register receives the old memory value. */
+#define GEN_ATOMIC_XADD(type, TYPE) \
+void helper_atomic_xadd##type(CPUX86State *env, target_ulong a0, \
+                int reg, int hreg)                               \
+{                                                                \
+    DATA_##type operand, oldv;                                   \
+    int eflags;                                                  \
+    /* addend: register content narrowed to the operand size */  \
+    operand = (DATA_##type)cm_get_reg_val(                       \
+            env, OT_##type, hreg, reg);                          \
+    /* oldv is re-captured on every retry of the transaction */  \
+    TX(a0, type, newv, {                                         \
+        oldv = newv;                                             \
+        newv += operand;                                         \
+    });                                                          \
+                                                                 \
+    /* transaction succeeded */                                  \
+    /* write the old value to the register and compute the eflags */ \
+    cm_set_reg_val(env, OT_##type, hreg, reg, oldv);             \
+    CC_SRC = oldv;                                               \
+    CC_DST = newv;                                               \
+                                                                 \
+    eflags = helper_cc_compute_all(CC_DST, CC_SRC, CC_SRC2,      \
+		    CC_OP_ADD##TYPE);                            \
+    CC_SRC = eflags;                                             \
+}
+
+GEN_ATOMIC_XADD(b, B);
+GEN_ATOMIC_XADD(w, W);
+GEN_ATOMIC_XADD(l, L);
+#ifdef TARGET_X86_64
+GEN_ATOMIC_XADD(q, Q);
+#endif
+
+/* CMPXCHG: compare the accumulator (R_EAX) with the operand at a0 and, via one compare-exchange, store `reg` on match. */
+#define GEN_ATOMIC_CMPXCHG(type, TYPE) \
+void helper_atomic_cmpxchg##type(CPUX86State *env, target_ulong a0, \
+                int reg, int hreg)                                  \
+{                                                                   \
+    DATA_##type reg_v, eax_v, res;                                  \
+    int eflags;                                                     \
+    unsigned long q_addr;                                           \
+                                                                    \
+    CM_GET_QEMU_ADDR(env, q_addr, a0);                              \
+    reg_v = (DATA_##type)cm_get_reg_val(env, OT_##type, hreg, reg); \
+    eax_v = (DATA_##type)cm_get_reg_val(env, OT_##type, 0, R_EAX);  \
+    /* res is what the compare-exchange reports for the memory operand */ \
+    res = atomic_compare_exchange##type(                            \
+            (DATA_##type *)q_addr, eax_v, reg_v);                   \
+    mb();                                                           \
+    /* mismatch: the accumulator is updated with the reported value */ \
+    if (res != eax_v)                                               \
+        cm_set_reg_val(env, OT_##type, 0, R_EAX, res);              \
+    /* flags are those of the subtraction accumulator - res */      \
+    CC_SRC = res;                                                   \
+    CC_DST = eax_v - res;                                           \
+                                                                    \
+    eflags = helper_cc_compute_all(CC_DST, CC_SRC, CC_SRC2,         \
+		    CC_OP_SUB##TYPE);                               \
+    CC_SRC = eflags;                                                \
+}
+
+GEN_ATOMIC_CMPXCHG(b, B);
+GEN_ATOMIC_CMPXCHG(w, W);
+GEN_ATOMIC_CMPXCHG(l, L);
+#ifdef TARGET_X86_64
+GEN_ATOMIC_CMPXCHG(q, Q);
+#endif
+
+#if defined(_LP64)
+/* CMPXCHG8B: compare EDX:EAX with the 64-bit value at guest address a0 using
+ * one 64-bit compare-exchange.  On match ECX:EBX is stored and Z is set; else
+ * the reported value is loaded into EDX:EAX and Z is cleared. */
+void helper_atomic_cmpxchg8b(CPUX86State *env, target_ulong a0)
+{
+    uint64_t edx_eax, ecx_ebx, res;
+    int eflags;
+    unsigned long q_addr;
+
+    /* Start from the current flags so that only CC_Z is modified. */
+    eflags = helper_cc_compute_all(CC_DST, CC_SRC, CC_SRC2, CC_OP);
+    CM_GET_QEMU_ADDR(env, q_addr, a0);
+    edx_eax = (((uint64_t)EDX << 32) | (uint32_t)EAX);
+    ecx_ebx = (((uint64_t)ECX << 32) | (uint32_t)EBX);
+    res = atomic_compare_exchangeq((uint64_t *)q_addr, edx_eax, ecx_ebx);
+    mb();
+    if (res == edx_eax) {
+        eflags |= CC_Z;
+    } else {
+        EDX = (uint32_t)(res >> 32);
+        EAX = (uint32_t)res;
+        eflags &= ~CC_Z;
+    }
+
+    CC_SRC = eflags;
+}
+#else
+/* Built without _LP64: not supported, so fail loudly instead of exiting 0. */
+void helper_atomic_cmpxchg8b(CPUX86State *env, target_ulong a0)
+{
+    assert(!"helper_atomic_cmpxchg8b: not supported.\n");
+    abort();    /* still terminates abnormally when NDEBUG removes the assert */
+}
+#endif
+
+void helper_atomic_cmpxchg16b(CPUX86State *env, target_ulong a0)
+{
+    uint8_t res;
+    int eflags;
+    unsigned long q_addr;
+    /* Emulates CMPXCHG16B on the 16 bytes at guest address a0; only CC_Z is changed in the flags. */
+    eflags = helper_cc_compute_all(CC_DST, CC_SRC, CC_SRC2, CC_OP);
+    CM_GET_QEMU_ADDR(env, q_addr, a0);
+    /* NOTE(review): these plain loads are separate from the CAS below, so on failure EDX/EAX may get values the CAS never compared. */
+    uint64_t old_rax = *(uint64_t *)q_addr;
+    uint64_t old_rdx = *(uint64_t *)(q_addr + 8);
+    res = atomic_compare_exchange16b((uint64_t *)q_addr, EAX, EDX, EBX, ECX);
+    mb();
+
+    if (res) {
+        eflags |= CC_Z;         /* swap success */
+    } else {
+        EDX = old_rdx;
+        EAX = old_rax;
+        eflags &= ~CC_Z;        /* read the old value ! */
+    }
+
+    CC_SRC = eflags;
+}
+
+/* NOT: atomically replace the operand at guest address a0 with its bitwise complement; no CC_* state is written. */
+#define GEN_ATOMIC_NOT(type) \
+void helper_atomic_not##type(CPUX86State *env, \
+                target_ulong a0)               \
+{                                              \
+    TX(a0, type, value, {                      \
+        value = ~value;                        \
+    });                                        \
+}
+
+GEN_ATOMIC_NOT(b);
+GEN_ATOMIC_NOT(w);
+GEN_ATOMIC_NOT(l);
+#ifdef TARGET_X86_64
+GEN_ATOMIC_NOT(q);
+#endif
+
+/* NEG: atomically replace the operand at guest address a0 with 0 - operand. */
+#define GEN_ATOMIC_NEG(type, TYPE) \
+void helper_atomic_neg##type(CPUX86State *env,              \
+                target_ulong a0)                            \
+{                                                           \
+    int eflags;                                             \
+                                                            \
+    TX(a0, type, value, {                                   \
+        value = -value;                                     \
+    });                                                     \
+                                                            \
+    /* Flags of "0 - old": result in CC_DST, old in CC_SRC */ \
+    CC_DST = value;                                         \
+    CC_SRC = (DATA_##type)-value;                           \
+    eflags = helper_cc_compute_all(CC_DST, CC_SRC, CC_SRC2, \
+                    CC_OP_SUB##TYPE);                       \
+    CC_SRC = eflags;                                        \
+}
+
+GEN_ATOMIC_NEG(b, B);
+GEN_ATOMIC_NEG(w, W);
+GEN_ATOMIC_NEG(l, L);
+#ifdef TARGET_X86_64
+GEN_ATOMIC_NEG(q, Q);
+#endif
+
+/* Variant of TX used only by the BTx helpers: the address obtained from
+ * CM_GET_QEMU_ADDR is advanced by `offset >> 3` bytes before the retry loop.
+ * With a register bit offset the value can be larger than operand size - 1
+ * (operand size can be 16/32/64); refer to Intel manual 2A, page 3-11. */
+#define TX2(vaddr, type, value, offset, command) \
+    unsigned long __q_addr;                                   \
+    DATA_##type __oldv;                                       \
+    DATA_##type value;                                        \
+    /* NOTE(review): callers pass a target_ulong offset (presumably unsigned), so negative bit offsets look unhandled - confirm */ \
+    CM_GET_QEMU_ADDR(env, __q_addr, vaddr);                   \
+    __q_addr += offset >> 3;                                  \
+    do {                                                      \
+        __oldv = value = LD_##type((DATA_##type *)__q_addr);  \
+        {command;};                                           \
+        mb();                                                 \
+    } while (__oldv != (atomic_compare_exchange##type(        \
+                    (DATA_##type *)__q_addr, __oldv, value)))
+
+#define GEN_ATOMIC_BTX(ins, command) \
+void helper_atomic_##ins(CPUX86State *env, target_ulong a0,   \
+                target_ulong offset, int ot)                  \
+{                                                             \
+    uint8_t old_byte;                                         \
+    int eflags;                                               \
+    /* Update bit (offset & 7) of the byte selected by TX2. */ \
+    TX2(a0, b, value, offset, {                               \
+        old_byte = value;                                     \
+        {command;};                                           \
+    });                                                       \
+    /* Old bit lands in bit 0 of CC_SRC for the flag helper. */ \
+    CC_SRC = (old_byte >> (offset & 0x7));                    \
+    CC_DST = 0;                                               \
+    eflags = helper_cc_compute_all(CC_DST, CC_SRC, CC_SRC2,   \
+		    CC_OP_SARB + ot);                         \
+    CC_SRC = eflags;                                          \
+}
+
+/* bts: set the selected bit */
+GEN_ATOMIC_BTX(bts, {
+    value |= (1 << (offset & 0x7));
+});
+/* btr: clear the selected bit */
+GEN_ATOMIC_BTX(btr, {
+    value &= ~(1 << (offset & 0x7));
+});
+/* btc: toggle the selected bit */
+GEN_ATOMIC_BTX(btc, {
+    value ^= (1 << (offset & 0x7));
+});
+
+/* Fence helper: issues the mb() memory barrier; `env` is not used. */
+void helper_fence(CPUX86State *env)
+{
+    mb();
+}
+
+#undef EAX  /* drop the register shorthands defined at the top of this file */
+#undef ECX
+#undef EDX
+#undef EBX