1
+ #include < Python.h>
2
+
1
3
#include " small_dynamic_array.h"
2
4
#include " vectorcall.h"
3
5
4
- #include < Python.h>
5
-
6
6
#include < algorithm>
7
7
#include < cstddef>
8
8
#include < new>
15
15
16
16
namespace {
17
17
18
+ template <typename T>
19
+ class immortal {
20
+ alignas (T) std::byte storage[sizeof (T)];
21
+
22
+ public:
23
+ template <typename ... Args>
24
+ immortal (Args &&... args) {
25
+ // Construct new T in storage
26
+ new (&storage) T (std::forward<Args>(args)...);
27
+ }
28
+ ~immortal () {
29
+ // Intentionally don't call destructor
30
+ }
31
+
32
+ T * get () { return reinterpret_cast <T *>(&storage); }
33
+ const T * get () const { return reinterpret_cast <const T *>(&storage); }
34
+ const T * get_const () const { return reinterpret_cast <const T *>(&storage); }
35
+
36
+ const T * operator ->() const { return get (); }
37
+ T * operator ->() { return get (); }
38
+
39
+ T & operator *() { return *get (); }
40
+ const T & operator *() const { return *get (); }
41
+ };
42
+
18
43
/* * Handle to a python object that automatically DECREFs */
19
44
class py_ref {
20
45
explicit py_ref (PyObject * object): obj_(object) {}
@@ -129,8 +154,8 @@ using global_state_t = std::unordered_map<std::string, global_backends>;
129
154
using local_state_t = std::unordered_map<std::string, local_backends>;
130
155
131
156
static py_ref BackendNotImplementedError;
132
- static global_state_t global_domain_map;
133
- thread_local global_state_t * current_global_state = & global_domain_map;
157
+ static immortal< global_state_t > global_domain_map;
158
+ thread_local global_state_t * current_global_state = global_domain_map.get() ;
134
159
thread_local global_state_t thread_local_domain_map;
135
160
thread_local local_state_t local_domain_map;
136
161
@@ -140,30 +165,30 @@ Using these with PyObject_GetAttr is faster than PyObject_GetAttrString which
140
165
has to create a new python string internally.
141
166
*/
142
167
struct {
143
- py_ref ua_convert;
144
- py_ref ua_domain;
145
- py_ref ua_function;
168
+ immortal< py_ref> ua_convert;
169
+ immortal< py_ref> ua_domain;
170
+ immortal< py_ref> ua_function;
146
171
147
172
bool init () {
148
- ua_convert = py_ref::steal (PyUnicode_InternFromString (" __ua_convert__" ));
149
- if (!ua_convert)
173
+ * ua_convert = py_ref::steal (PyUnicode_InternFromString (" __ua_convert__" ));
174
+ if (!* ua_convert)
150
175
return false ;
151
176
152
- ua_domain = py_ref::steal (PyUnicode_InternFromString (" __ua_domain__" ));
153
- if (!ua_domain)
177
+ * ua_domain = py_ref::steal (PyUnicode_InternFromString (" __ua_domain__" ));
178
+ if (!* ua_domain)
154
179
return false ;
155
180
156
- ua_function = py_ref::steal (PyUnicode_InternFromString (" __ua_function__" ));
157
- if (!ua_function)
181
+ * ua_function = py_ref::steal (PyUnicode_InternFromString (" __ua_function__" ));
182
+ if (!* ua_function)
158
183
return false ;
159
184
160
185
return true ;
161
186
}
162
187
163
188
void clear () {
164
- ua_convert. reset ();
165
- ua_domain. reset ();
166
- ua_function. reset ();
189
+ ua_convert-> reset ();
190
+ ua_domain-> reset ();
191
+ ua_function-> reset ();
167
192
}
168
193
} identifiers;
169
194
@@ -202,7 +227,7 @@ std::string domain_to_string(PyObject * domain) {
202
227
203
228
Py_ssize_t backend_get_num_domains (PyObject * backend) {
204
229
auto domain =
205
- py_ref::steal (PyObject_GetAttr (backend, identifiers.ua_domain . get ()));
230
+ py_ref::steal (PyObject_GetAttr (backend, identifiers.ua_domain -> get ()));
206
231
if (!domain)
207
232
return -1 ;
208
233
@@ -225,7 +250,7 @@ enum class LoopReturn { Continue, Break, Error };
225
250
template <typename Func>
226
251
LoopReturn backend_for_each_domain (PyObject * backend, Func f) {
227
252
auto domain =
228
- py_ref::steal (PyObject_GetAttr (backend, identifiers.ua_domain . get ()));
253
+ py_ref::steal (PyObject_GetAttr (backend, identifiers.ua_domain -> get ()));
229
254
if (!domain)
230
255
return LoopReturn::Error;
231
256
@@ -537,7 +562,7 @@ struct BackendState {
537
562
538
563
/* * Clean up global python references when the module is finalized. */
539
564
void globals_free (void * /* self */ ) {
540
- global_domain_map. clear ();
565
+ global_domain_map-> clear ();
541
566
BackendNotImplementedError.reset ();
542
567
identifiers.clear ();
543
568
}
@@ -550,7 +575,7 @@ void globals_free(void * /* self */) {
550
575
* cleanup.
551
576
*/
552
577
int globals_traverse (PyObject * self, visitproc visit, void * arg) {
553
- for (const auto & kv : global_domain_map) {
578
+ for (const auto & kv : * global_domain_map) {
554
579
const auto & globals = kv.second ;
555
580
PyObject * backend = globals.global .backend .get ();
556
581
Py_VISIT (backend);
@@ -563,7 +588,7 @@ int globals_traverse(PyObject * self, visitproc visit, void * arg) {
563
588
}
564
589
565
590
int globals_clear (PyObject * /* self */ ) {
566
- global_domain_map. clear ();
591
+ global_domain_map-> clear ();
567
592
return 0 ;
568
593
}
569
594
@@ -1170,7 +1195,8 @@ py_ref Function::canonicalize_kwargs(PyObject * kwargs) {
1170
1195
1171
1196
py_func_args Function::replace_dispatchables (
1172
1197
PyObject * backend, PyObject * args, PyObject * kwargs, PyObject * coerce) {
1173
- auto has_ua_convert = PyObject_HasAttr (backend, identifiers.ua_convert .get ());
1198
+ auto has_ua_convert =
1199
+ PyObject_HasAttr (backend, identifiers.ua_convert ->get ());
1174
1200
if (!has_ua_convert) {
1175
1201
return {py_ref::ref (args), py_ref::ref (kwargs)};
1176
1202
}
@@ -1182,7 +1208,7 @@ py_func_args Function::replace_dispatchables(
1182
1208
1183
1209
PyObject * convert_args[] = {backend, dispatchables.get (), coerce};
1184
1210
auto res = py_ref::steal (Q_PyObject_VectorcallMethod (
1185
- identifiers.ua_convert . get (), convert_args,
1211
+ identifiers.ua_convert -> get (), convert_args,
1186
1212
array_size (convert_args) | Q_PY_VECTORCALL_ARGUMENTS_OFFSET, nullptr ));
1187
1213
if (!res) {
1188
1214
return {};
@@ -1287,7 +1313,7 @@ PyObject * Function::call(PyObject * args_, PyObject * kwargs_) {
1287
1313
backend, reinterpret_cast <PyObject *>(this ), new_args.args .get (),
1288
1314
new_args.kwargs .get ()};
1289
1315
result = py_ref::steal (Q_PyObject_VectorcallMethod (
1290
- identifiers.ua_function . get (), args,
1316
+ identifiers.ua_function -> get (), args,
1291
1317
array_size (args) | Q_PY_VECTORCALL_ARGUMENTS_OFFSET, nullptr ));
1292
1318
1293
1319
// raise BackendNotImplemeted is equivalent to return NotImplemented
@@ -1499,7 +1525,7 @@ PyObject * get_state(PyObject * /* self */, PyObject * /* args */) {
1499
1525
1500
1526
output->locals = local_domain_map;
1501
1527
output->use_thread_local_globals =
1502
- (current_global_state != & global_domain_map);
1528
+ (current_global_state != global_domain_map. get () );
1503
1529
output->globals = *current_global_state;
1504
1530
1505
1531
return ref.release ();
@@ -1522,8 +1548,8 @@ PyObject * set_state(PyObject * /* self */, PyObject * args) {
1522
1548
local_domain_map = state->locals ;
1523
1549
bool use_thread_local_globals =
1524
1550
(!reset_allowed) || state->use_thread_local_globals ;
1525
- current_global_state =
1526
- use_thread_local_globals ? &thread_local_domain_map : & global_domain_map;
1551
+ current_global_state = use_thread_local_globals ? &thread_local_domain_map
1552
+ : global_domain_map. get () ;
1527
1553
1528
1554
if (use_thread_local_globals)
1529
1555
thread_local_domain_map = state->globals ;
@@ -1554,7 +1580,7 @@ PyObject * determine_backend(PyObject * /*self*/, PyObject * args) {
1554
1580
auto result = for_each_backend_in_domain (
1555
1581
domain, [&](PyObject * backend, bool coerce_backend) {
1556
1582
auto has_ua_convert =
1557
- PyObject_HasAttr (backend, identifiers.ua_convert . get ());
1583
+ PyObject_HasAttr (backend, identifiers.ua_convert -> get ());
1558
1584
1559
1585
if (!has_ua_convert) {
1560
1586
// If no __ua_convert__, assume it won't accept the type
@@ -1566,7 +1592,7 @@ PyObject * determine_backend(PyObject * /*self*/, PyObject * args) {
1566
1592
(coerce && coerce_backend) ? Py_True : Py_False};
1567
1593
1568
1594
auto res = py_ref::steal (Q_PyObject_VectorcallMethod (
1569
- identifiers.ua_convert . get (), convert_args,
1595
+ identifiers.ua_convert -> get (), convert_args,
1570
1596
array_size (convert_args) | Q_PY_VECTORCALL_ARGUMENTS_OFFSET,
1571
1597
nullptr ));
1572
1598
if (!res) {
@@ -1775,13 +1801,8 @@ PyModuleDef uarray_module = {
1775
1801
1776
1802
} // namespace
1777
1803
1778
- #if defined(WIN32) || defined(_WIN32)
1779
- # define MODULE_EXPORT __declspec (dllexport)
1780
- #else
1781
- # define MODULE_EXPORT __attribute__ ((visibility(" default" )))
1782
- #endif
1783
1804
1784
- extern " C " MODULE_EXPORT PyObject * PyInit__uarray (void ) {
1805
+ PyMODINIT_FUNC PyInit__uarray (void ) {
1785
1806
1786
1807
auto m = py_ref::steal (PyModule_Create (&uarray_module));
1787
1808
if (!m)
@@ -1823,5 +1844,9 @@ extern "C" MODULE_EXPORT PyObject * PyInit__uarray(void) {
1823
1844
if (!identifiers.init ())
1824
1845
return nullptr ;
1825
1846
1847
+ #if Py_GIL_DISABLED
1848
+ PyUnstable_Module_SetGIL (m.get (), Py_MOD_GIL_NOT_USED);
1849
+ #endif
1850
+
1826
1851
return m.release ();
1827
1852
}
0 commit comments