Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Implement _layout_ on ctypes structs #1937

Open
wants to merge 1 commit into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
36 changes: 28 additions & 8 deletions src/core/IronPython.Modules/_ctypes/StructType.cs
Original file line number Diff line number Diff line change
Expand Up @@ -33,6 +33,9 @@ public static partial class CTypes {
/// </summary>
[PythonType, PythonHidden]
public class StructType : PythonType, INativeType {

private enum LayoutKind { Msvc, Gcc }

[DisallowNull]
internal Field[]? _fields; // not null after type construction completes
private int? _size, _alignment, _pack;
Expand Down Expand Up @@ -252,6 +255,7 @@ internal static PythonType MakeSystemType(Type underlyingSystemType) {
return PythonType.SetPythonType(underlyingSystemType, new StructType(underlyingSystemType));
}


[MemberNotNull(nameof(_fields), nameof(_size), nameof(_alignment))]
private void SetFields(object? fields) {
lock (this) {
Expand All @@ -263,11 +267,12 @@ private void SetFields(object? fields) {
List<Field> allFields = GetBaseSizeAlignmentAndFields(out int size, out int alignment);

IList<string>? anonFields = GetAnonymousFields(this);
LayoutKind layout = GetStructLayout(this);

foreach (object fieldDef in fieldDefList) {
GetFieldInfo(this, fieldDef, out string fieldName, out INativeType cdata, out bitCount);

int fieldOffset = UpdateSizeAndAlignment(cdata, bitCount, ref lastType, ref size, ref alignment, ref curBitCount);
int fieldOffset = UpdateSizeAndAlignment(cdata, bitCount, layout, ref lastType, ref size, ref alignment, ref curBitCount);

var newField = new Field(fieldName, cdata, fieldOffset, allFields.Count, bitCount, curBitCount - bitCount);
allFields.Add(newField);
Expand All @@ -292,6 +297,7 @@ private void SetFields(object? fields) {
}
}


internal static void CheckAnonymousFields(List<Field> allFields, IList<string>? anonFields) {
if (anonFields != null) {
foreach (string s in anonFields) {
Expand Down Expand Up @@ -365,9 +371,10 @@ private List<Field> GetBaseSizeAlignmentAndFields(out int size, out int alignmen
foreach (PythonType pt in BaseTypes) {
if (pt is StructType st) {
st.EnsureFinal();
LayoutKind layout = GetStructLayout(st);
foreach (Field f in st._fields) {
allFields.Add(f);
UpdateSizeAndAlignment(f.NativeType, f.BitCount, ref lastType, ref size, ref alignment, ref totalBitCount);
UpdateSizeAndAlignment(f.NativeType, f.BitCount, layout, ref lastType, ref size, ref alignment, ref totalBitCount);

if (f.NativeType == this) {
throw StructureCannotContainSelf();
Expand Down Expand Up @@ -404,7 +411,7 @@ private List<Field> GetBaseSizeAlignmentAndFields(out int size, out int alignmen
/// On return, the count is updated with the number of occupied bits.</param>
/// <returns>
/// The offset of the processed field within the struct. If the processed field was a bitfield, this is the offset of its container unit.</returns>
private int UpdateSizeAndAlignment(INativeType cdata, int? bitCount, ref INativeType? lastType, ref int size, ref int alignment, ref int? totalBitCount) {
private int UpdateSizeAndAlignment(INativeType cdata, int? bitCount, LayoutKind layout, ref INativeType? lastType, ref int size, ref int alignment, ref int? totalBitCount) {
int fieldOffset;
if (bitCount != null) {
// process a bitfield
Expand All @@ -413,7 +420,7 @@ private int UpdateSizeAndAlignment(INativeType cdata, int? bitCount, ref INative

if (_pack != null) throw new NotImplementedException("pack with bitfields"); // TODO: implement

if (UseMsvcBitfieldAlignmentRules) {
if (layout is LayoutKind.Msvc) {
if (totalBitCount != null) { // there is already a bitfield container open
// under the MSVC rules, only bitfields of type that has the same size/alignment, are packed into the same container unit
if (lastType!.Size != cdata.Size || lastType.Alignment != cdata.Alignment) {
Expand Down Expand Up @@ -443,7 +450,7 @@ private int UpdateSizeAndAlignment(INativeType cdata, int? bitCount, ref INative
totalBitCount = bitCount;
lastType = cdata;
}
} else { // GCC bitfield alignment rules
} else if (layout is LayoutKind.Gcc) {
// under the GCC rules, all bitfields are packed into the same container unit or an overlapping container unit of a different type,
// as long as they fit and match the alignment
int containerOffset = AlignBack(size, cdata.Alignment); // TODO: _pack
Expand All @@ -460,6 +467,8 @@ private int UpdateSizeAndAlignment(INativeType cdata, int? bitCount, ref INative
fieldOffset = size = containerOffset;
totalBitCount = containerBitCount + bitCount;
lastType = cdata;
} else {
throw new InvalidOperationException("unknown layout kind");
}
alignment = Math.Max(alignment, lastType!.Alignment); // TODO: _pack
} else {
Expand Down Expand Up @@ -500,6 +509,20 @@ internal void EnsureFinal() {
}
}


private static LayoutKind GetStructLayout(PythonType type) {
if (type.TryGetBoundAttr(type.Context.SharedContext, type, "_layout_", out object layout) && layout is not null) {
if (Converter.TryConvertToString(layout, out string? layoutName)) {
if (layoutName.StartsWith("ms", StringComparison.Ordinal)) return LayoutKind.Msvc;
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Any reason for using StartsWith instead of an exact check? The current 3.14 doc seems to say it should either be ms or gcc-sysv.

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

My reason was that 3.14 is still in alpha and I find the current choice somewhat unfortunate, so I wouldn't be surprised if it changes before the release. In all places I've seen the layouts are called the MSVC layout and the GCC layout (sometimes GCC/Clang layout). Additionally, in the first few weeks working on layout I kept forgetting the string gcc-sysv. I remembered that it was gcc- plus some OS name, but was it gcc-aix? gcc-hpux? etc... I bet that in a year I'll forget again... 👴

I think I can guess why the names were chosen as they are, but it does not convince me these were the best choices. If it were up to me, I would use msvc for the MSVC layout, and for the GCC/Linux layout gcc, with aliases clang and gcc-sysv for the latter. Perhaps an alias ms for the former, if you insist.

I don't know the CPython's development process, perhaps there is some sort of a review of new features before the beta is released, so maybe the names will be changed. I suppose once 3.14b1 is released, the names will be baked in for good. The more relaxed check is in place in case I don't have time (or forget) to come back and fix it in IronPython to whatever the beta will have.

if (layoutName.StartsWith("gcc", StringComparison.Ordinal)) return LayoutKind.Gcc;
}
throw PythonOps.ValueError("unknown _layout_: {0}", layout);
}
// default layout for structs is platform dependent
return RuntimeInformation.IsOSPlatform(OSPlatform.Windows) ? LayoutKind.Msvc : LayoutKind.Gcc;
}


/// <summary>
/// If our size/alignment hasn't been initialized then grabs the size/alignment
/// from all of our base classes. If later new _fields_ are added we'll be
Expand All @@ -525,9 +548,6 @@ private void EnsureSizeAndAlignment() {

private static int AlignBack(int length, int size)
=> length & ~(size - 1);

private static bool UseMsvcBitfieldAlignmentRules
=> RuntimeInformation.IsOSPlatform(OSPlatform.Windows);
}
}
}
Expand Down
53 changes: 51 additions & 2 deletions tests/suite/modules/type_related/test_ctypes.py
Original file line number Diff line number Diff line change
Expand Up @@ -507,12 +507,12 @@ class Test(Structure):
]

self.check_bitfield(Test.a, c_longlong, 0, 0, 20)
if is_posix and (is_cli or sys.version_info < (3, 14)): # CPython 3.14 implements MSVC behaviour (bug)
if is_posix and (is_cli or sys.version_info < (3, 14)): # CPython 3.14 implements MSVC behaviour when _layout_ is not set
if is_cli: # GCC-compliant results
self.check_bitfield(Test.b, c_short, 2, 4, 2)
self.check_bitfield(Test.c, c_short, 2, 6, 15)
self.assertEqual(sizeof(Test), 5)
else: # bug in CPython
else: # https://github.com/python/cpython/issues/131747
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Just a quick note on your CPython bug report, the current dev doc does say that it defaults to ms when _pack_ is specified.

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Yes, so it is a "documented bug" as I see it, and technically python/cpython#131747 is probably a feature request, one that was not practical before 3.14 started to support _layout_. The reason why IronPython diverges here from CPython is because CPython currently does not support #pragma pack with the GCC layout under any circumstances — at least not yet, and I do not see it on the roadmap. I read from the python/cpython#131747 (comment) by @encukou is that there are plans to overhaul the the whole _layout_ syntax to something more flexible and extensible, but it is at this point not fleshed out yet.

OTOH for IronPython, as the next steps, I intended to implement the GCC layout for bitfields in a GCC-compliant way. Following CPython's documented behaviour literally would mean that to get the default GCC behaviour with bitfields on Linux you would have to set _layout_ = 'gcc-sysv', lest you be silently served the MSVC layout. So you would have to be explicit in Python to get the GCC default, and the default in Python is something rarely used in GCC... 😵‍💫

Just to be clear, this PR does not bring GCC packed layout with bitfields yet — it's just the tests, which are currently being skipped. Implementing GCC packing with bitfields turned out to be surprisingly cumbersome, as GCC can lay the fields out in such a way that to access them requires more data than the total size of the underlying data type used. E.g. as I currently understand it, to access a bitfield of length 57 defined on c_longlong (normally 64 bit), may require reading and processing 9 bytes. This can be done but will require a significant rework of the current code logic, and, frankly, I feel that I'd rather spend my effort on other things, hence no promises.

self.check_bitfield(Test.b, c_short, 6, 20, 2)
self.check_bitfield(Test.c, c_short, 6, 22, 15)
self.assertEqual(sizeof(Test), 8)
Expand Down Expand Up @@ -905,6 +905,55 @@ class Test(Structure):
self.assertEqual(sizeof(Test), 16)


@unittest.skipUnless(is_cli or sys.version_info >= (3, 14), '_layout_ not supported before CPython 3.14')
def test_bitfield_mixed_H3_layout_msvc(self):
class Test(Structure):
_layout_ = 'ms'
_fields_ = [
("a", c_longlong, 52),
("b", c_byte, 5),
]

self.check_bitfield(Test.a, c_longlong, 0, 0, 52)
self.check_bitfield(Test.b, c_byte, 8, 0, 5)
self.assertEqual(sizeof(Test), 16)


@unittest.skipUnless(is_cli or sys.version_info >= (3, 14), '_layout_ not supported before CPython 3.14')
def test_bitfield_mixed_H3_layout_gcc(self):
class Test(Structure):
_layout_ = 'gcc-sysv'
_fields_ = [
("a", c_longlong, 52),
("b", c_byte, 5),
]

self.check_bitfield(Test.a, c_longlong, 0, 0, 52)
self.check_bitfield(Test.b, c_byte, 7, 0, 5)
self.assertEqual(sizeof(Test), 8)


@unittest.skipUnless(is_cli or sys.version_info >= (3, 14), '_layout_ not supported before CPython 3.14')
def test_bitfield_mixed_H3_layout_default(self):
class Test(Structure):
_layout_ = None
_fields_ = [
("a", c_longlong, 52),
("b", c_byte, 5),
]
self.assertEqual(sizeof(Test), 8 if is_posix else 16)


@unittest.skipUnless(is_cli or sys.version_info >= (3, 14), '_layout_ not supported before CPython 3.14')
def test_bitfield_mixed_H3_layout_invalid(self):
with self.assertRaises(ValueError) as context:
class Test(Structure):
_layout_ = "invalid"
_fields_ = []

self.assertIn("unknown _layout_", str(context.exception))


@unittest.skipIf(is_posix, 'Windows specific test')
def test_loadlibrary_error(self):
with self.assertRaises(OSError) as cm:
Expand Down