diff --git a/llvm/lib/MC/MCParser/MasmParser.cpp b/llvm/lib/MC/MCParser/MasmParser.cpp --- a/llvm/lib/MC/MCParser/MasmParser.cpp +++ b/llvm/lib/MC/MCParser/MasmParser.cpp @@ -128,9 +128,11 @@ struct StructInfo { StringRef Name; bool IsUnion = false; + bool Initializable = true; unsigned Alignment = 0; - unsigned Size = 0; unsigned AlignmentSize = 0; + unsigned NextOffset = 0; + unsigned Size = 0; std::vector Fields; StringMap FieldsByName; @@ -322,7 +324,7 @@ struct FieldInfo { // Offset of the field within the containing STRUCT. - size_t Offset = 0; + unsigned Offset = 0; // Total size of the field (= LengthOf * Type). unsigned SizeOf = 0; @@ -344,11 +346,10 @@ FieldsByName[FieldName.lower()] = Fields.size(); Fields.emplace_back(FT); FieldInfo &Field = Fields.back(); - if (IsUnion) { - Field.Offset = 0; - } else { - Size = llvm::alignTo(Size, std::min(Alignment, FieldAlignmentSize)); - Field.Offset = Size; + Field.Offset = + llvm::alignTo(NextOffset, std::min(Alignment, FieldAlignmentSize)); + if (!IsUnion) { + NextOffset = std::max(NextOffset, Field.Offset); } AlignmentSize = std::max(AlignmentSize, FieldAlignmentSize); return Field; @@ -669,6 +670,7 @@ DK_REAL8, DK_REAL10, DK_ALIGN, + DK_EVEN, DK_ORG, DK_ENDR, DK_EXTERN, @@ -871,8 +873,11 @@ bool parseDirectiveEquate(StringRef IDVal, StringRef Name, DirectiveKind DirKind, SMLoc NameLoc); - bool parseDirectiveOrg(); // ".org" + bool parseDirectiveOrg(); // "org" + + bool emitAlignTo(int64_t Alignment); bool parseDirectiveAlign(); // "align" + bool parseDirectiveEven(); // "even" // ".file", ".line", ".loc", ".stabs" bool parseDirectiveFile(SMLoc DirectiveLoc); @@ -2332,6 +2337,8 @@ return parseDirectiveNestedEnds(); case DK_ALIGN: return parseDirectiveAlign(); + case DK_EVEN: + return parseDirectiveEven(); case DK_ORG: return parseDirectiveOrg(); case DK_EXTERN: @@ -3663,10 +3670,11 @@ Field.SizeOf = Field.Type * IntInfo.Values.size(); Field.LengthOf = IntInfo.Values.size(); - if (Struct.IsUnion) - Struct.Size = std::max(Struct.Size, Field.SizeOf); - else - Struct.Size += Field.SizeOf; + const unsigned FieldEnd = Field.Offset + Field.SizeOf; + if (!Struct.IsUnion) { + Struct.NextOffset = FieldEnd; + } + Struct.Size = std::max(Struct.Size, FieldEnd); return false; } @@ -3869,10 +3877,12 @@ Field.Type = RealInfo.AsIntValues.back().getBitWidth() / 8; Field.LengthOf = RealInfo.AsIntValues.size(); Field.SizeOf = Field.Type * Field.LengthOf; - if (Struct.IsUnion) - Struct.Size = std::max(Struct.Size, Field.SizeOf); - else - Struct.Size += Field.SizeOf; + + const unsigned FieldEnd = Field.Offset + Field.SizeOf; + if (!Struct.IsUnion) { + Struct.NextOffset = FieldEnd; + } + Struct.Size = std::max(Struct.Size, FieldEnd); return false; } @@ -4281,14 +4291,16 @@ const StructFieldInfo &Contents, const StructFieldInfo &Initializer) { for (const auto &Init : Initializer.Initializers) { - emitStructInitializer(Contents.Structure, Init); + if (emitStructInitializer(Contents.Structure, Init)) + return true; } // Default-initialize all remaining values. for (auto It = Contents.Initializers.begin() + Initializer.Initializers.size(); It != Contents.Initializers.end(); ++It) { const auto &Init = *It; - emitStructInitializer(Contents.Structure, Init); + if (emitStructInitializer(Contents.Structure, Init)) + return true; } return false; } @@ -4311,6 +4323,10 @@ bool MasmParser::emitStructInitializer(const StructInfo &Structure, const StructInitializer &Initializer) { + if (!Structure.Initializable) + return Error(getLexer().getLoc(), + "cannot initialize a value of type '" + Structure.Name + + "'; 'org' was used in the type's declaration"); size_t Index = 0, Offset = 0; for (const auto &Init : Initializer.FieldInitializers) { const auto &Field = Structure.Fields[Index++]; @@ -4367,10 +4383,12 @@ Field.LengthOf = StructInfo.Initializers.size(); Field.SizeOf = Field.Type * Field.LengthOf; - if (OwningStruct.IsUnion) - OwningStruct.Size = std::max(OwningStruct.Size, Field.SizeOf); - else - OwningStruct.Size += Field.SizeOf; + + const unsigned FieldEnd = Field.Offset + Field.SizeOf; + if (!OwningStruct.IsUnion) { + OwningStruct.NextOffset = FieldEnd; + } + OwningStruct.Size = std::max(OwningStruct.Size, FieldEnd); return false; } @@ -4529,17 +4547,28 @@ ParentStruct.FieldsByName[FieldByName.getKey()] = FieldByName.getValue() + OldFields; } - if (!ParentStruct.IsUnion) { + + unsigned FirstFieldOffset = 0; + if (!Structure.Fields.empty() && !ParentStruct.IsUnion) { + FirstFieldOffset = llvm::alignTo( + ParentStruct.NextOffset, + std::min(ParentStruct.Alignment, Structure.AlignmentSize)); + } + + if (ParentStruct.IsUnion) { + ParentStruct.Size = std::max(ParentStruct.Size, Structure.Size); + } else { for (auto FieldIter = ParentStruct.Fields.begin() + OldFields; FieldIter != ParentStruct.Fields.end(); ++FieldIter) { - FieldIter->Offset += ParentStruct.Size; + FieldIter->Offset += FirstFieldOffset; } - } - if (ParentStruct.IsUnion) - ParentStruct.Size = std::max(ParentStruct.Size, Structure.Size); - else - ParentStruct.Size += Structure.Size; + const unsigned StructureEnd = FirstFieldOffset + Structure.Size; + if (!ParentStruct.IsUnion) { + ParentStruct.NextOffset = StructureEnd; + } + ParentStruct.Size = std::max(ParentStruct.Size, StructureEnd); + } } else { FieldInfo &Field = ParentStruct.addField(Structure.Name, FT_STRUCT, Structure.AlignmentSize); @@ -4548,10 +4577,11 @@ Field.LengthOf = 1; Field.SizeOf = Structure.Size; - if (ParentStruct.IsUnion) - ParentStruct.Size = std::max(ParentStruct.Size, Field.SizeOf); - else - ParentStruct.Size += Field.SizeOf; + const unsigned StructureEnd = Field.Offset + Field.SizeOf; + if (!ParentStruct.IsUnion) { + ParentStruct.NextOffset = StructureEnd; + } + ParentStruct.Size = std::max(ParentStruct.Size, StructureEnd); StructInfo.Structure = Structure; StructInfo.Initializers.emplace_back(); @@ -4565,22 +4595,66 @@ } /// parseDirectiveOrg -/// ::= .org expression [ , expression ] +/// ::= org expression bool MasmParser::parseDirectiveOrg() { const MCExpr *Offset; SMLoc OffsetLoc = Lexer.getLoc(); if (checkForValidSection() || parseExpression(Offset)) return true; - - // Parse optional fill expression. - int64_t FillExpr = 0; - if (parseOptionalToken(AsmToken::Comma)) - if (parseAbsoluteExpression(FillExpr)) - return addErrorSuffix(" in '.org' directive"); if (parseToken(AsmToken::EndOfStatement)) - return addErrorSuffix(" in '.org' directive"); + return addErrorSuffix(" in 'org' directive"); + + if (StructInProgress.empty()) { + // Not in a struct; change the offset for the next instruction or data + if (checkForValidSection()) + return addErrorSuffix(" in 'org' directive"); + + getStreamer().emitValueToOffset(Offset, 0, OffsetLoc); + } else { + // Offset the next field of this struct + StructInfo &Structure = StructInProgress.back(); + int64_t OffsetRes; + if (!Offset->evaluateAsAbsolute(OffsetRes, getStreamer().getAssemblerPtr())) + return Error(OffsetLoc, + "expected absolute expression in 'org' directive"); + if (OffsetRes < 0) + return Error( + OffsetLoc, + "expected non-negative value in struct's 'org' directive; was " + + std::to_string(OffsetRes)); + Structure.NextOffset = static_cast(OffsetRes); + + // ORG-affected structures cannot be initialized + Structure.Initializable = false; + } + + return false; +} + +bool MasmParser::emitAlignTo(int64_t Alignment) { + if (StructInProgress.empty()) { + // Not in a struct; align the next instruction or data + if (checkForValidSection()) + return true; + + // Check whether we should use optimal code alignment for this align + // directive. + const MCSection *Section = getStreamer().getCurrentSectionOnly(); + assert(Section && "must have section to emit alignment"); + if (Section->UseCodeAlign()) { + getStreamer().emitCodeAlignment(Alignment, /*MaxBytesToEmit=*/0); + } else { + // FIXME: Target specific behavior about how the "extra" bytes are filled. + getStreamer().emitValueToAlignment(Alignment, /*Value=*/0, + /*ValueSize=*/1, + /*MaxBytesToEmit=*/0); + } + } else { + // Align the next field of this struct + StructInfo &Structure = StructInProgress.back(); + Structure.NextOffset = llvm::alignTo(Structure.NextOffset, Alignment); + } - getStreamer().emitValueToOffset(Offset, FillExpr, OffsetLoc); return false; } @@ -4590,8 +4664,6 @@ SMLoc AlignmentLoc = getLexer().getLoc(); int64_t Alignment; - if (checkForValidSection()) - return addErrorSuffix(" in align directive"); // Ignore empty 'align' directives. if (getTok().is(AsmToken::EndOfStatement)) { return Warning(AlignmentLoc, @@ -4602,31 +4674,32 @@ parseToken(AsmToken::EndOfStatement)) return addErrorSuffix(" in align directive"); - // Always emit an alignment here even if we thrown an error. + // Always emit an alignment here even if we throw an error. bool ReturnVal = false; - // Reject alignments that aren't either a power of two or zero, for gas + // Reject alignments that aren't either a power of two or zero, for ML.exe // compatibility. Alignment of zero is silently rounded up to one. if (Alignment == 0) Alignment = 1; if (!isPowerOf2_64(Alignment)) - ReturnVal |= Error(AlignmentLoc, "alignment must be a power of 2"); - - // Check whether we should use optimal code alignment for this align - // directive. - const MCSection *Section = getStreamer().getCurrentSectionOnly(); - assert(Section && "must have section to emit alignment"); - if (Section->UseCodeAlign()) { - getStreamer().emitCodeAlignment(Alignment, /*MaxBytesToEmit=*/0); - } else { - // FIXME: Target specific behavior about how the "extra" bytes are filled. - getStreamer().emitValueToAlignment(Alignment, /*Value=*/0, /*ValueSize=*/1, - /*MaxBytesToEmit=*/0); - } + ReturnVal |= Error(AlignmentLoc, "alignment must be a power of 2; was " + + std::to_string(Alignment)); + + if (emitAlignTo(Alignment)) + ReturnVal |= addErrorSuffix(" in align directive"); return ReturnVal; } +/// parseDirectiveEven +/// ::= even +bool MasmParser::parseDirectiveEven() { + if (parseToken(AsmToken::EndOfStatement) || emitAlignTo(2)) + return addErrorSuffix(" in even directive"); + + return false; +} + /// parseDirectiveFile /// ::= .file filename /// ::= .file number [directory] filename [md5 checksum] [source source-text] @@ -6520,7 +6593,8 @@ DirectiveKindMap["real8"] = DK_REAL8; DirectiveKindMap["real10"] = DK_REAL10; DirectiveKindMap["align"] = DK_ALIGN; - // DirectiveKindMap[".org"] = DK_ORG; + DirectiveKindMap["even"] = DK_EVEN; + DirectiveKindMap["org"] = DK_ORG; DirectiveKindMap["extern"] = DK_EXTERN; DirectiveKindMap["public"] = DK_PUBLIC; // DirectiveKindMap[".comm"] = DK_COMM; diff --git a/llvm/test/tools/llvm-ml/align_directives.asm b/llvm/test/tools/llvm-ml/align_directives.asm new file mode 100644 --- /dev/null +++ b/llvm/test/tools/llvm-ml/align_directives.asm @@ -0,0 +1,116 @@ +; RUN: llvm-ml -filetype=s %s /Fo - | FileCheck %s + +.data + +align_test: +ALIGN 16 +; CHECK-LABEL: align_test: +; CHECK-NEXT: .p2align 4 + +org_test: +ORG 256 +; CHECK-LABEL: org_test: +; CHECK-NEXT: .org 256, 0 + +align_struct STRUCT + BYTE ? + + ALIGN 4 + x BYTE ? + x_succ BYTE ? + BYTE ? + + ALIGN 2 + y BYTE ? + y_succ BYTE ? + + ALIGN 1 + z BYTE ? + + EVEN + q BYTE ? +align_struct ENDS + +struct_align_data ALIGN_STRUCT <101, 102, 103, 104, 105, 106, 107, 108> +; CHECK-LABEL: struct_align_data: +; CHECK-NEXT: .byte 101 +; CHECK-NEXT: .zero 3 +; CHECK-NEXT: .byte 102 +; CHECK-NEXT: .byte 103 +; CHECK-NEXT: .byte 104 +; CHECK-NEXT: .zero 1 +; CHECK-NEXT: .byte 105 +; CHECK-NEXT: .byte 106 +; CHECK-NEXT: .byte 107 +; CHECK-NEXT: .zero 1 +; CHECK-NEXT: .byte 108 + +org_struct STRUCT + x BYTE ? + x_succ BYTE ? + ORG 15 + y BYTE ? + y_succ BYTE ? + ORG 2 + z BYTE ? + z_succ BYTE ? +org_struct ENDS + +.code + +struct_align_test PROC + +x_align_test: + MOV eax, align_struct.x + MOV eax, align_struct.x_succ +; CHECK-LABEL: x_align_test: +; CHECK-NEXT: mov eax, 4 +; CHECK-NEXT: mov eax, 5 + +y_align_test: + MOV eax, align_struct.y + MOV eax, align_struct.y_succ +; CHECK-LABEL: y_align_test: +; CHECK-NEXT: mov eax, 8 +; CHECK-NEXT: mov eax, 9 + +z_align_test: + MOV eax, align_struct.z +; CHECK-LABEL: z_align_test: +; CHECK-NEXT: mov eax, 10 + +q_even_test: + MOV eax, align_struct.q +; CHECK-LABEL: q_even_test: +; CHECK-NEXT: mov eax, 12 + +size_align_test: + MOV eax, SIZEOF(align_struct) +; CHECK-LABEL: size_align_test: +; CHECK-NEXT: mov eax, 13 + + ret +struct_align_test ENDP + +struct_org_test PROC +; CHECK-LABEL: struct_org_test: + +field_positions: + MOV eax, org_struct.x + MOV eax, org_struct.x_succ + MOV eax, org_struct.y + MOV eax, org_struct.y_succ + MOV eax, org_struct.z + MOV eax, org_struct.z_succ +; CHECK-LABEL: field_positions: +; CHECK-NEXT: mov eax, 0 +; CHECK-NEXT: mov eax, 1 +; CHECK-NEXT: mov eax, 15 +; CHECK-NEXT: mov eax, 16 +; CHECK-NEXT: mov eax, 2 +; CHECK-NEXT: mov eax, 3 + + ret +struct_org_test ENDP + +end diff --git a/llvm/test/tools/llvm-ml/align_errors.asm b/llvm/test/tools/llvm-ml/align_errors.asm new file mode 100644 --- /dev/null +++ b/llvm/test/tools/llvm-ml/align_errors.asm @@ -0,0 +1,21 @@ +; RUN: not llvm-ml -filetype=s %s /Fo /dev/null 2>&1 | FileCheck %s --implicit-check-not=error: + +.data +org_struct STRUCT + x BYTE ? + x_succ BYTE ? + ORG 15 + y BYTE ? + y_succ BYTE ? + +; CHECK: :[[# @LINE + 1]]:7: error: expected non-negative value in struct's 'org' directive; was -4 + ORG -4 + + z BYTE ? + z_succ BYTE ? +org_struct ENDS + +; CHECK: :[[# @LINE + 1]]:16: error: cannot initialize a value of type 'org_struct'; 'org' was used in the type's declaration +x org_struct <> + +end