#ifndef Py_ATOMIC_H
#define Py_ATOMIC_H
/* XXX: When compilers start offering a stdatomic.h with lock-free
   atomic_int and atomic_address types, include that here and rewrite
   the atomic operations in terms of it. */

#include "dynamic_annotations.h"

#ifdef __cplusplus
extern "C" {
#endif

/* This is modeled after the atomics interface from C1x, according to
 * the draft at
 * http://www.open-std.org/JTC1/SC22/wg14/www/docs/n1425.pdf.
 * Operations and types are named the same except with a _Py_ prefix
 * and have the same semantics.
 *
 * Beware, the implementations here are deep magic.
 */
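
/* For example, C1x's
 *     atomic_store_explicit(&obj, val, memory_order_release)
 * corresponds to
 *     _Py_atomic_store_explicit(&obj, val, _Py_memory_order_release)
 * here. */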

typedef enum _Py_memory_order {
    _Py_memory_order_relaxed,
    _Py_memory_order_acquire,
    _Py_memory_order_release,
    _Py_memory_order_acq_rel,
    _Py_memory_order_seq_cst
} _Py_memory_order;

typedef struct _Py_atomic_address {
    void *_value;
} _Py_atomic_address;

typedef struct _Py_atomic_int {
    int _value;
} _Py_atomic_int;
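
/* The _value fields are wrapped in structs (and named with a leading
 * underscore) to discourage direct access; static aggregate
 * initialization still works, e.g. (illustrative):
 *
 *     static _Py_atomic_int initialized = {0};
 *     static _Py_atomic_address head = {NULL};
 */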

/* Only support GCC (for expression statements) and x86 (for simple
 * atomic semantics) for now */
#if defined(__GNUC__) && (defined(__i386__) || defined(__amd64))

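/* A signal fence only has to keep the compiler from reordering memory
 * accesses around it (a signal handler runs on the same core), so a
 * compiler barrier is enough; no fence instruction is emitted. */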
static __inline__ void
_Py_atomic_signal_fence(_Py_memory_order order)
{
    if (order != _Py_memory_order_relaxed)
        __asm__ volatile("":::"memory");
}

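/* A thread fence must also order this thread's accesses as seen by
 * other cores.  On x86 only store-load reordering is observable, and
 * `mfence` rules it out. */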
static __inline__ void
_Py_atomic_thread_fence(_Py_memory_order order)
{
    if (order != _Py_memory_order_relaxed)
        __asm__ volatile("mfence":::"memory");
}

/* Tell the race checker about this operation's effects. */
static __inline__ void
_Py_ANNOTATE_MEMORY_ORDER(const volatile void *address, _Py_memory_order order)
{
    switch(order) {
    case _Py_memory_order_release:
    case _Py_memory_order_acq_rel:
    case _Py_memory_order_seq_cst:
        _Py_ANNOTATE_HAPPENS_BEFORE(address);
        break;
    default:
        break;
    }
    switch(order) {
    case _Py_memory_order_acquire:
    case _Py_memory_order_acq_rel:
    case _Py_memory_order_seq_cst:
        _Py_ANNOTATE_HAPPENS_AFTER(address);
        break;
    default:
        break;
    }
}

#define _Py_atomic_store_explicit(ATOMIC_VAL, NEW_VAL, ORDER) \
    __extension__ ({ \
        __typeof__(ATOMIC_VAL) atomic_val = ATOMIC_VAL; \
        __typeof__(atomic_val->_value) new_val = NEW_VAL; \
        volatile __typeof__(new_val) *volatile_data = &atomic_val->_value; \
        _Py_memory_order order = ORDER; \
        _Py_ANNOTATE_MEMORY_ORDER(atomic_val, order); \
        \
        /* Perform the operation. */ \
        _Py_ANNOTATE_IGNORE_WRITES_BEGIN(); \
        switch(order) { \
        case _Py_memory_order_release: \
            _Py_atomic_signal_fence(_Py_memory_order_release); \
            /* fallthrough */ \
        case _Py_memory_order_relaxed: \
            *volatile_data = new_val; \
            break; \
        \
        case _Py_memory_order_acquire: \
        case _Py_memory_order_acq_rel: \
        case _Py_memory_order_seq_cst: \
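            /* `xchg` with a memory operand implicitly asserts the */ \
            /* lock prefix, so it doubles as a full memory barrier. */ \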
            __asm__ volatile("xchg %0, %1" \
                             : "+r"(new_val) \
                             : "m"(atomic_val->_value) \
                             : "memory"); \
            break; \
        } \
        _Py_ANNOTATE_IGNORE_WRITES_END(); \
    })

#define _Py_atomic_load_explicit(ATOMIC_VAL, ORDER) \
    __extension__ ({ \
        __typeof__(ATOMIC_VAL) atomic_val = ATOMIC_VAL; \
        __typeof__(atomic_val->_value) result; \
        volatile __typeof__(result) *volatile_data = &atomic_val->_value; \
        _Py_memory_order order = ORDER; \
        _Py_ANNOTATE_MEMORY_ORDER(atomic_val, order); \
        \
        /* Perform the operation. */ \
        _Py_ANNOTATE_IGNORE_READS_BEGIN(); \
        switch(order) { \
        case _Py_memory_order_release: \
        case _Py_memory_order_acq_rel: \
        case _Py_memory_order_seq_cst: \
            /* A plain x86 load may be reordered ahead of earlier */ \
            /* stores, so these orderings need a real thread fence */ \
            /* before the load. */ \
            _Py_atomic_thread_fence(_Py_memory_order_release); \
            break; \
        default: \
            /* No fence */ \
            break; \
        } \
        result = *volatile_data; \
        switch(order) { \
        case _Py_memory_order_acquire: \
        case _Py_memory_order_acq_rel: \
        case _Py_memory_order_seq_cst: \
            /* Loads on x86 are automatically acquire operations, so */ \
            /* we can get by with just a compiler fence. */ \
            _Py_atomic_signal_fence(_Py_memory_order_acquire); \
            break; \
        default: \
            /* No fence */ \
            break; \
        } \
        _Py_ANNOTATE_IGNORE_READS_END(); \
        result; \
    })

#else /* !gcc x86 */
/* Fall back to other compilers and processors by assuming that simple
   volatile accesses are atomic.  That assumption is false in general,
   so this should be ported to each new platform. */
#define _Py_atomic_signal_fence(/*memory_order*/ ORDER) ((void)0)
#define _Py_atomic_thread_fence(/*memory_order*/ ORDER) ((void)0)
#define _Py_atomic_store_explicit(ATOMIC_VAL, NEW_VAL, ORDER) \
    ((ATOMIC_VAL)->_value = (NEW_VAL))
#define _Py_atomic_load_explicit(ATOMIC_VAL, ORDER) \
    ((ATOMIC_VAL)->_value)

#endif /* !gcc x86 */

/* Standardized shortcuts. */
#define _Py_atomic_store(ATOMIC_VAL, NEW_VAL) \
    _Py_atomic_store_explicit(ATOMIC_VAL, NEW_VAL, _Py_memory_order_seq_cst)
#define _Py_atomic_load(ATOMIC_VAL) \
    _Py_atomic_load_explicit(ATOMIC_VAL, _Py_memory_order_seq_cst)

/* Python-local extensions */

#define _Py_atomic_store_relaxed(ATOMIC_VAL, NEW_VAL) \
    _Py_atomic_store_explicit(ATOMIC_VAL, NEW_VAL, _Py_memory_order_relaxed)
#define _Py_atomic_load_relaxed(ATOMIC_VAL) \
    _Py_atomic_load_explicit(ATOMIC_VAL, _Py_memory_order_relaxed)

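/* Example usage (illustrative only; `request_flag` and
 * `handle_request` are hypothetical, not defined by this header).
 * A signaling thread publishes a flag with full seq_cst ordering:
 *
 *     static _Py_atomic_int request_flag = {0};
 *     _Py_atomic_store(&request_flag, 1);
 *
 * while a polling thread can use a cheaper relaxed load in its
 * busy loop:
 *
 *     if (_Py_atomic_load_relaxed(&request_flag))
 *         handle_request();
 */
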
#ifdef __cplusplus
}
#endif

#endif /* Py_ATOMIC_H */