Skip to content

Commit 646a65d

Browse files
authored
Merge pull request #281 from hameerabbasi/upstream-fix
Upstream SciPy fix and maintenance.
2 parents 9344c0b + 29bae47 commit 646a65d

File tree

5 files changed

+84
-39
lines changed

5 files changed

+84
-39
lines changed

.github/dependabot.yml

+13
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
# Set update schedule for GitHub Actions
2+
# This opens a PR when actions in workflows need an update
3+
4+
version: 2
5+
updates:
6+
- package-ecosystem: "github-actions"
7+
directory: "/"
8+
schedule:
9+
# Check for updates to GitHub Actions every week
10+
interval: "weekly"
11+
commit-message:
12+
prefix: "skip changelog" # So this PR will not be added to release-drafter
13+
include: "scope" # List of the updated dependencies in the commit will be added

.github/workflows/build.yaml

+2-2
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@ jobs:
2828
fetch-depth: 0
2929

3030
- name: Build wheels
31-
uses: pypa/cibuildwheel@v2.20.0
31+
uses: pypa/cibuildwheel@v2.22.0
3232
- uses: actions/upload-artifact@v4
3333
with:
3434
name: cibw-wheels-${{ matrix.os }}-${{ strategy.job-index }}
@@ -97,7 +97,7 @@ jobs:
9797
- name: Run clang-format style check for C/C++ code.
9898
uses: jidicula/[email protected]
9999
with:
100-
clang-format-version: '18'
100+
clang-format-version: '19'
101101
check-path: 'src'
102102
- name: Upload coverage to Codecov
103103
uses: codecov/codecov-action@v4

pyproject.toml

+7-1
Original file line numberDiff line numberDiff line change
@@ -73,11 +73,17 @@ disallow_any_unimported = false
7373
build = "{cp3{10..13}-*,pp310-*}"
7474
build-frontend = "build"
7575
free-threaded-support = true
76-
test-command = "pip install -r {project}/requirements/tests.txt && pytest --pyargs uarray"
76+
before-test = "pip install -r {project}/requirements/tests.txt"
77+
test-command = "pytest --pyargs uarray"
7778

7879
[tool.cibuildwheel.macos]
7980
archs = ["universal2"]
8081

82+
[[tool.cibuildwheel.overrides]]
83+
select = "*-macosx_*"
84+
inherit.environment = "append"
85+
environment.MACOSX_DEPLOYMENT_TARGET = "10.13"
86+
8187
[tool.cibuildwheel.config-settings]
8288
"cmake.verbose" = true
8389
"logging.level" = "INFO"

src/CMakeLists.txt

+2-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,5 @@
11
cmake_minimum_required(VERSION 3.15...3.30)
2+
23
project(${SKBUILD_PROJECT_NAME} LANGUAGES CXX)
34

45
find_package(Python COMPONENTS Interpreter Development.Module REQUIRED)
@@ -9,5 +10,5 @@ Python_add_library(_uarray MODULE
910
vectorcall.cxx
1011
_uarray_dispatch.cxx
1112
WITH_SOABI)
12-
set_property(TARGET _uarray PROPERTY CXX_STANDARD 11)
13+
set_property(TARGET _uarray PROPERTY CXX_STANDARD 17)
1314
install(TARGETS _uarray LIBRARY DESTINATION uarray)

src/_uarray_dispatch.cxx

+60-35
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,8 @@
1+
#include <Python.h>
2+
13
#include "small_dynamic_array.h"
24
#include "vectorcall.h"
35

4-
#include <Python.h>
5-
66
#include <algorithm>
77
#include <cstddef>
88
#include <new>
@@ -15,6 +15,31 @@
1515

1616
namespace {
1717

18+
template <typename T>
19+
class immortal {
20+
alignas(T) std::byte storage[sizeof(T)];
21+
22+
public:
23+
template <typename... Args>
24+
immortal(Args &&... args) {
25+
// Construct new T in storage
26+
new (&storage) T(std::forward<Args>(args)...);
27+
}
28+
~immortal() {
29+
// Intentionally don't call destructor
30+
}
31+
32+
T * get() { return reinterpret_cast<T *>(&storage); }
33+
const T * get() const { return reinterpret_cast<const T *>(&storage); }
34+
const T * get_const() const { return reinterpret_cast<const T *>(&storage); }
35+
36+
const T * operator->() const { return get(); }
37+
T * operator->() { return get(); }
38+
39+
T & operator*() { return *get(); }
40+
const T & operator*() const { return *get(); }
41+
};
42+
1843
/** Handle to a python object that automatically DECREFs */
1944
class py_ref {
2045
explicit py_ref(PyObject * object): obj_(object) {}
@@ -129,8 +154,8 @@ using global_state_t = std::unordered_map<std::string, global_backends>;
129154
using local_state_t = std::unordered_map<std::string, local_backends>;
130155

131156
static py_ref BackendNotImplementedError;
132-
static global_state_t global_domain_map;
133-
thread_local global_state_t * current_global_state = &global_domain_map;
157+
static immortal<global_state_t> global_domain_map;
158+
thread_local global_state_t * current_global_state = global_domain_map.get();
134159
thread_local global_state_t thread_local_domain_map;
135160
thread_local local_state_t local_domain_map;
136161

@@ -140,30 +165,30 @@ Using these with PyObject_GetAttr is faster than PyObject_GetAttrString which
140165
has to create a new python string internally.
141166
*/
142167
struct {
143-
py_ref ua_convert;
144-
py_ref ua_domain;
145-
py_ref ua_function;
168+
immortal<py_ref> ua_convert;
169+
immortal<py_ref> ua_domain;
170+
immortal<py_ref> ua_function;
146171

147172
bool init() {
148-
ua_convert = py_ref::steal(PyUnicode_InternFromString("__ua_convert__"));
149-
if (!ua_convert)
173+
*ua_convert = py_ref::steal(PyUnicode_InternFromString("__ua_convert__"));
174+
if (!*ua_convert)
150175
return false;
151176

152-
ua_domain = py_ref::steal(PyUnicode_InternFromString("__ua_domain__"));
153-
if (!ua_domain)
177+
*ua_domain = py_ref::steal(PyUnicode_InternFromString("__ua_domain__"));
178+
if (!*ua_domain)
154179
return false;
155180

156-
ua_function = py_ref::steal(PyUnicode_InternFromString("__ua_function__"));
157-
if (!ua_function)
181+
*ua_function = py_ref::steal(PyUnicode_InternFromString("__ua_function__"));
182+
if (!*ua_function)
158183
return false;
159184

160185
return true;
161186
}
162187

163188
void clear() {
164-
ua_convert.reset();
165-
ua_domain.reset();
166-
ua_function.reset();
189+
ua_convert->reset();
190+
ua_domain->reset();
191+
ua_function->reset();
167192
}
168193
} identifiers;
169194

@@ -202,7 +227,7 @@ std::string domain_to_string(PyObject * domain) {
202227

203228
Py_ssize_t backend_get_num_domains(PyObject * backend) {
204229
auto domain =
205-
py_ref::steal(PyObject_GetAttr(backend, identifiers.ua_domain.get()));
230+
py_ref::steal(PyObject_GetAttr(backend, identifiers.ua_domain->get()));
206231
if (!domain)
207232
return -1;
208233

@@ -225,7 +250,7 @@ enum class LoopReturn { Continue, Break, Error };
225250
template <typename Func>
226251
LoopReturn backend_for_each_domain(PyObject * backend, Func f) {
227252
auto domain =
228-
py_ref::steal(PyObject_GetAttr(backend, identifiers.ua_domain.get()));
253+
py_ref::steal(PyObject_GetAttr(backend, identifiers.ua_domain->get()));
229254
if (!domain)
230255
return LoopReturn::Error;
231256

@@ -537,7 +562,7 @@ struct BackendState {
537562

538563
/** Clean up global python references when the module is finalized. */
539564
void globals_free(void * /* self */) {
540-
global_domain_map.clear();
565+
global_domain_map->clear();
541566
BackendNotImplementedError.reset();
542567
identifiers.clear();
543568
}
@@ -550,7 +575,7 @@ void globals_free(void * /* self */) {
550575
* cleanup.
551576
*/
552577
int globals_traverse(PyObject * self, visitproc visit, void * arg) {
553-
for (const auto & kv : global_domain_map) {
578+
for (const auto & kv : *global_domain_map) {
554579
const auto & globals = kv.second;
555580
PyObject * backend = globals.global.backend.get();
556581
Py_VISIT(backend);
@@ -563,7 +588,7 @@ int globals_traverse(PyObject * self, visitproc visit, void * arg) {
563588
}
564589

565590
int globals_clear(PyObject * /* self */) {
566-
global_domain_map.clear();
591+
global_domain_map->clear();
567592
return 0;
568593
}
569594

@@ -1170,7 +1195,8 @@ py_ref Function::canonicalize_kwargs(PyObject * kwargs) {
11701195

11711196
py_func_args Function::replace_dispatchables(
11721197
PyObject * backend, PyObject * args, PyObject * kwargs, PyObject * coerce) {
1173-
auto has_ua_convert = PyObject_HasAttr(backend, identifiers.ua_convert.get());
1198+
auto has_ua_convert =
1199+
PyObject_HasAttr(backend, identifiers.ua_convert->get());
11741200
if (!has_ua_convert) {
11751201
return {py_ref::ref(args), py_ref::ref(kwargs)};
11761202
}
@@ -1182,7 +1208,7 @@ py_func_args Function::replace_dispatchables(
11821208

11831209
PyObject * convert_args[] = {backend, dispatchables.get(), coerce};
11841210
auto res = py_ref::steal(Q_PyObject_VectorcallMethod(
1185-
identifiers.ua_convert.get(), convert_args,
1211+
identifiers.ua_convert->get(), convert_args,
11861212
array_size(convert_args) | Q_PY_VECTORCALL_ARGUMENTS_OFFSET, nullptr));
11871213
if (!res) {
11881214
return {};
@@ -1287,7 +1313,7 @@ PyObject * Function::call(PyObject * args_, PyObject * kwargs_) {
12871313
backend, reinterpret_cast<PyObject *>(this), new_args.args.get(),
12881314
new_args.kwargs.get()};
12891315
result = py_ref::steal(Q_PyObject_VectorcallMethod(
1290-
identifiers.ua_function.get(), args,
1316+
identifiers.ua_function->get(), args,
12911317
array_size(args) | Q_PY_VECTORCALL_ARGUMENTS_OFFSET, nullptr));
12921318

12931319
// raise BackendNotImplemeted is equivalent to return NotImplemented
@@ -1499,7 +1525,7 @@ PyObject * get_state(PyObject * /* self */, PyObject * /* args */) {
14991525

15001526
output->locals = local_domain_map;
15011527
output->use_thread_local_globals =
1502-
(current_global_state != &global_domain_map);
1528+
(current_global_state != global_domain_map.get());
15031529
output->globals = *current_global_state;
15041530

15051531
return ref.release();
@@ -1522,8 +1548,8 @@ PyObject * set_state(PyObject * /* self */, PyObject * args) {
15221548
local_domain_map = state->locals;
15231549
bool use_thread_local_globals =
15241550
(!reset_allowed) || state->use_thread_local_globals;
1525-
current_global_state =
1526-
use_thread_local_globals ? &thread_local_domain_map : &global_domain_map;
1551+
current_global_state = use_thread_local_globals ? &thread_local_domain_map
1552+
: global_domain_map.get();
15271553

15281554
if (use_thread_local_globals)
15291555
thread_local_domain_map = state->globals;
@@ -1554,7 +1580,7 @@ PyObject * determine_backend(PyObject * /*self*/, PyObject * args) {
15541580
auto result = for_each_backend_in_domain(
15551581
domain, [&](PyObject * backend, bool coerce_backend) {
15561582
auto has_ua_convert =
1557-
PyObject_HasAttr(backend, identifiers.ua_convert.get());
1583+
PyObject_HasAttr(backend, identifiers.ua_convert->get());
15581584

15591585
if (!has_ua_convert) {
15601586
// If no __ua_convert__, assume it won't accept the type
@@ -1566,7 +1592,7 @@ PyObject * determine_backend(PyObject * /*self*/, PyObject * args) {
15661592
(coerce && coerce_backend) ? Py_True : Py_False};
15671593

15681594
auto res = py_ref::steal(Q_PyObject_VectorcallMethod(
1569-
identifiers.ua_convert.get(), convert_args,
1595+
identifiers.ua_convert->get(), convert_args,
15701596
array_size(convert_args) | Q_PY_VECTORCALL_ARGUMENTS_OFFSET,
15711597
nullptr));
15721598
if (!res) {
@@ -1775,13 +1801,8 @@ PyModuleDef uarray_module = {
17751801

17761802
} // namespace
17771803

1778-
#if defined(WIN32) || defined(_WIN32)
1779-
# define MODULE_EXPORT __declspec(dllexport)
1780-
#else
1781-
# define MODULE_EXPORT __attribute__((visibility("default")))
1782-
#endif
17831804

1784-
extern "C" MODULE_EXPORT PyObject * PyInit__uarray(void) {
1805+
PyMODINIT_FUNC PyInit__uarray(void) {
17851806

17861807
auto m = py_ref::steal(PyModule_Create(&uarray_module));
17871808
if (!m)
@@ -1823,5 +1844,9 @@ extern "C" MODULE_EXPORT PyObject * PyInit__uarray(void) {
18231844
if (!identifiers.init())
18241845
return nullptr;
18251846

1847+
#if Py_GIL_DISABLED
1848+
PyUnstable_Module_SetGIL(m.get(), Py_MOD_GIL_NOT_USED);
1849+
#endif
1850+
18261851
return m.release();
18271852
}

0 commit comments

Comments
 (0)