apache · olabusayoT · Oct 9, 2024 · Oct 16, 2024 · Oct 29, 2024 · Nov 4, 2024
diff --git a/daffodil-codegen-c/src/main/scala/org/apache/daffodil/codegen/c/DaffodilCCodeGenerator.scala b/daffodil-codegen-c/src/main/scala/org/apache/daffodil/codegen/c/DaffodilCCodeGenerator.scala
@@ -49,7 +49,7 @@ import org.apache.daffodil.core.grammar.primitives.ChoiceCombinator
 import org.apache.daffodil.core.grammar.primitives.ElementCombinator
 import org.apache.daffodil.core.grammar.primitives.ElementParseAndUnspecifiedLength
 import org.apache.daffodil.core.grammar.primitives.ElementUnused
-import org.apache.daffodil.core.grammar.primitives.HexBinaryLengthPrefixed
+import org.apache.daffodil.core.grammar.primitives.HexBinaryEndOfBitLimit
 import org.apache.daffodil.core.grammar.primitives.HexBinarySpecifiedLength
 import org.apache.daffodil.core.grammar.primitives.OrderedSequence
 import org.apache.daffodil.core.grammar.primitives.RepOrderedExactlyNSequenceChild
@@ -59,6 +59,7 @@ import org.apache.daffodil.core.grammar.primitives.RightFill
 import org.apache.daffodil.core.grammar.primitives.ScalarOrderedSequenceChild
 import org.apache.daffodil.core.grammar.primitives.SpecifiedLengthExplicit
 import org.apache.daffodil.core.grammar.primitives.SpecifiedLengthImplicit
+import org.apache.daffodil.core.grammar.primitives.SpecifiedLengthPrefixed
 import org.apache.daffodil.lib.api.Diagnostic
 import org.apache.daffodil.lib.api.WarnID
 import org.apache.daffodil.lib.schema.annotation.props.gen.FailureType
@@ -288,7 +289,8 @@ object DaffodilCCodeGenerator
       case g: ElementParseAndUnspecifiedLength =>
         elementParseAndUnspecifiedLengthGenerateCode(g, cgState)
       case g: ElementUnused => noop(g)
-      case g: HexBinaryLengthPrefixed => hexBinaryLengthPrefixedGenerateCode(g.e, cgState)
+      case g: HexBinaryEndOfBitLimit if g.e.isPrefixed =>
+        hexBinaryLengthPrefixedGenerateCode(g.e, cgState)
       case g: HexBinarySpecifiedLength => hexBinarySpecifiedLengthGenerateCode(g.e, cgState)
       case g: OrderedSequence => orderedSequenceGenerateCode(g, cgState)
       case g: Prod => prod(g, cgState)
@@ -301,6 +303,7 @@ object DaffodilCCodeGenerator
       case g: SeqComp => seqCompGenerateCode(g, cgState)
       case g: SpecifiedLengthExplicit => specifiedLengthExplicit(g, cgState)
       case g: SpecifiedLengthImplicit => specifiedLengthImplicit(g, cgState)
+      case g: SpecifiedLengthPrefixed => specifiedLengthPrefixed(g, cgState)
       case _ => gram.SDE("Code generation not supported for: %s", Misc.getNameFromClass(gram))
     }
   }
@@ -409,4 +412,11 @@ object DaffodilCCodeGenerator
   ): Unit = {
     DaffodilCCodeGenerator.generateCode(g.eGram, cgState)
   }
+
+  private def specifiedLengthPrefixed(
+    g: SpecifiedLengthPrefixed,
+    cgState: CodeGeneratorState
+  ): Unit = {
+    DaffodilCCodeGenerator.generateCode(g.eGram, cgState)
+  }
 }
diff --git a/daffodil-core/src/main/scala/org/apache/daffodil/core/grammar/ElementBaseGrammarMixin.scala b/daffodil-core/src/main/scala/org/apache/daffodil/core/grammar/ElementBaseGrammarMixin.scala
@@ -72,7 +72,9 @@ trait ElementBaseGrammarMixin
     }
   }
 
-  protected lazy val isDelimitedPrefixedPattern = {
+  lazy val isPrefixed: Boolean = lengthKind == LengthKind.Prefixed
+
+  protected lazy val isDelimitedPrefixedPattern: Boolean = {
     import LengthKind._
     lengthKind match {
       case Delimited =>
@@ -474,12 +476,16 @@ trait ElementBaseGrammarMixin
     lazy val leftPadding = leftPaddingArg
     lazy val rightPadFill = rightPadFillArg
     lazy val body = bodyArg
-    CaptureContentLengthStart(this) ~
-      leftPadding ~
-      CaptureValueLengthStart(this) ~
-      body ~
-      CaptureValueLengthEnd(this) ~
-      rightPadFill ~
+    specifiedLength(
+      CaptureContentLengthStart(this) ~
+        leftPadding ~
+        CaptureValueLengthStart(this) ~
+        body ~
+        CaptureValueLengthEnd(this) ~
+        rightPadFill
+    ) ~
+      // CaptureContentLengthEnd must be outside the specified length so it can
+      // do any skipping of bits it needs to before capturing the end of content length
       CaptureContentLengthEnd(this)
   }
 
@@ -623,14 +629,14 @@ trait ElementBaseGrammarMixin
 
   private lazy val stringPrim = {
     lengthKind match {
-      case LengthKind.Explicit => specifiedLength(StringOfSpecifiedLength(this))
-      case LengthKind.Prefixed => specifiedLength(StringOfSpecifiedLength(this))
+      case LengthKind.Explicit => StringOfSpecifiedLength(this)
+      case LengthKind.Prefixed => StringOfSpecifiedLength(this)
       case LengthKind.Delimited => stringDelimitedEndOfData
-      case LengthKind.Pattern => specifiedLength(StringOfSpecifiedLength(this))
+      case LengthKind.Pattern => StringOfSpecifiedLength(this)
       case LengthKind.Implicit => {
         val pt = this.simpleType.primType
         Assert.invariant(pt == PrimType.String)
-        specifiedLength(StringOfSpecifiedLength(this))
+        StringOfSpecifiedLength(this)
       }
       case LengthKind.EndOfParent if isComplexType =>
         notYetImplemented("lengthKind='endOfParent' for complex type")
@@ -645,11 +651,11 @@ trait ElementBaseGrammarMixin
   }
 
   private lazy val hexBinaryLengthPattern = prod("hexBinaryLengthPattern") {
-    new SpecifiedLengthPattern(this, new HexBinaryEndOfBitLimit(this))
+    new HexBinaryEndOfBitLimit(this)
   }
 
   private lazy val hexBinaryLengthPrefixed = prod("hexBinaryLengthPrefixed") {
-    new HexBinaryLengthPrefixed(this)
+    new HexBinaryEndOfBitLimit(this)
   }
 
   private lazy val hexBinaryValue = prod("hexBinaryValue") {
@@ -1226,7 +1232,7 @@ trait ElementBaseGrammarMixin
   }
 
   private lazy val nilLitSimple = prod("nilLitSimple", isSimpleType) {
-    captureLengthRegions(leftPadding, specifiedLength(nilLitContent), rightPadding ~ rightFill)
+    captureLengthRegions(leftPadding, nilLitContent, rightPadding ~ rightFill)
   }
 
   private lazy val nilLitComplex = prod("nilLitComplex", isComplexType) {
@@ -1329,7 +1335,10 @@ trait ElementBaseGrammarMixin
    * as well, by not enclosing the body in a specified length enforcer.
    */
   private def specifiedLength(bodyArg: => Gram) = {
-    lazy val body = bodyArg
+    // Evaluate the body eagerly, before wrapping it in a specified-length parser,
+    // so that it can run its internal checks first (for example, blobValue's check
+    // for a non-explicit lengthKind).
+    val body = bodyArg
     lazy val bitsMultiplier = lengthUnits match {
       case LengthUnits.Bits => 1
       case LengthUnits.Bytes => 8
@@ -1341,7 +1350,13 @@ trait ElementBaseGrammarMixin
       case LengthKind.Delimited => body
       case LengthKind.Pattern => new SpecifiedLengthPattern(this, body)
       case LengthKind.Explicit if bitsMultiplier != 0 =>
-        new SpecifiedLengthExplicit(this, body, bitsMultiplier)
+        if (isSimpleType && primType == PrimType.HexBinary) {
+          // hexBinary performs its own checks, which wrapping the body in
+          // SpecifiedLengthExplicit would get in the way of, so return the body unwrapped
+          body
+        } else {
+          new SpecifiedLengthExplicit(this, body, bitsMultiplier)
+        }
       case LengthKind.Explicit => {
         Assert.invariant(!knownEncodingIsFixedWidth)
         Assert.invariant(lengthUnits eq LengthUnits.Characters)
@@ -1366,14 +1381,15 @@ trait ElementBaseGrammarMixin
       }
       case LengthKind.Implicit if isSimpleType && primType == PrimType.String =>
         new SpecifiedLengthImplicitCharacters(this, body, this.maxLength.longValue)
-
-      case LengthKind.Implicit if isSimpleType && primType == PrimType.HexBinary =>
-        new SpecifiedLengthImplicit(this, body, this.maxLength.longValue * bitsMultiplier)
       case LengthKind.Implicit
-          if isSimpleType && impliedRepresentation == Representation.Binary =>
+          if isSimpleType &&
+            impliedRepresentation == Representation.Binary &&
+            primType != PrimType.HexBinary =>
         new SpecifiedLengthImplicit(this, body, implicitBinaryLengthInBits)
-      case LengthKind.Implicit if isComplexType =>
+      case LengthKind.Implicit =>
         body // for complex types, implicit means "roll up from the bottom"
+      // the case above also covers the remaining simple types: their primitives have custom
+      // parsers that handle implicit length and ignore the SpecifiedLengthImplicit limit
       case LengthKind.EndOfParent if isComplexType =>
         notYetImplemented("lengthKind='endOfParent' for complex type")
       case LengthKind.EndOfParent =>
@@ -1403,7 +1419,7 @@ trait ElementBaseGrammarMixin
   private lazy val sharedComplexContentRegion: Gram =
     schemaSet.sharedComplexContentFactory.getShared(
       shareKey,
-      captureLengthRegions(EmptyGram, specifiedLength(complexContent), elementUnused) ~
+      captureLengthRegions(EmptyGram, complexContent, elementUnused) ~
         terminatorRegion
     )
 

diff --git a/daffodil-core/src/main/scala/org/apache/daffodil/core/grammar/primitives/PrimitivesBCD.scala b/daffodil-core/src/main/scala/org/apache/daffodil/core/grammar/primitives/PrimitivesBCD.scala
@@ -19,18 +19,18 @@ package org.apache.daffodil.core.grammar.primitives
 
 import org.apache.daffodil.core.dsom.ElementBase
 import org.apache.daffodil.core.grammar.Terminal
+import org.apache.daffodil.runtime1.processors.parsers.BCDDecimalBitLimitLengthParser
 import org.apache.daffodil.runtime1.processors.parsers.BCDDecimalKnownLengthParser
-import org.apache.daffodil.runtime1.processors.parsers.BCDDecimalPrefixedLengthParser
 import org.apache.daffodil.runtime1.processors.parsers.BCDDecimalRuntimeLengthParser
+import org.apache.daffodil.runtime1.processors.parsers.BCDIntegerBitLimitLengthParser
 import org.apache.daffodil.runtime1.processors.parsers.BCDIntegerKnownLengthParser
-import org.apache.daffodil.runtime1.processors.parsers.BCDIntegerPrefixedLengthParser
 import org.apache.daffodil.runtime1.processors.parsers.BCDIntegerRuntimeLengthParser
 import org.apache.daffodil.runtime1.processors.unparsers.Unparser
 import org.apache.daffodil.unparsers.runtime1.BCDDecimalKnownLengthUnparser
-import org.apache.daffodil.unparsers.runtime1.BCDDecimalPrefixedLengthUnparser
+import org.apache.daffodil.unparsers.runtime1.BCDDecimalMinimumLengthUnparser
 import org.apache.daffodil.unparsers.runtime1.BCDDecimalRuntimeLengthUnparser
 import org.apache.daffodil.unparsers.runtime1.BCDIntegerKnownLengthUnparser
-import org.apache.daffodil.unparsers.runtime1.BCDIntegerPrefixedLengthUnparser
+import org.apache.daffodil.unparsers.runtime1.BCDIntegerMinimumLengthUnparser
 import org.apache.daffodil.unparsers.runtime1.BCDIntegerRuntimeLengthUnparser
 
 class BCDIntegerRuntimeLength(val e: ElementBase) extends Terminal(e, true) {
@@ -52,20 +52,10 @@ class BCDIntegerKnownLength(val e: ElementBase, lengthInBits: Long) extends Term
 
 class BCDIntegerPrefixedLength(val e: ElementBase) extends Terminal(e, true) {
 
-  override lazy val parser = new BCDIntegerPrefixedLengthParser(
-    e.elementRuntimeData,
-    e.prefixedLengthBody.parser,
-    e.prefixedLengthElementDecl.elementRuntimeData,
-    e.lengthUnits,
-    e.prefixedLengthAdjustmentInUnits
-  )
+  override lazy val parser = new BCDIntegerBitLimitLengthParser(e.elementRuntimeData)
 
-  override lazy val unparser: Unparser = new BCDIntegerPrefixedLengthUnparser(
-    e.elementRuntimeData,
-    e.prefixedLengthBody.unparser,
-    e.prefixedLengthElementDecl.elementRuntimeData,
-    e.lengthUnits,
-    e.prefixedLengthAdjustmentInUnits
+  override lazy val unparser: Unparser = new BCDIntegerMinimumLengthUnparser(
+    e.elementRuntimeData
   )
 }
 
@@ -102,21 +92,9 @@ class BCDDecimalKnownLength(val e: ElementBase, lengthInBits: Long) extends Term
 
 class BCDDecimalPrefixedLength(val e: ElementBase) extends Terminal(e, true) {
 
-  override lazy val parser = new BCDDecimalPrefixedLengthParser(
-    e.elementRuntimeData,
-    e.prefixedLengthBody.parser,
-    e.prefixedLengthElementDecl.elementRuntimeData,
-    e.binaryDecimalVirtualPoint,
-    e.lengthUnits,
-    e.prefixedLengthAdjustmentInUnits
-  )
+  override lazy val parser =
+    new BCDDecimalBitLimitLengthParser(e.elementRuntimeData, e.binaryDecimalVirtualPoint)
 
-  override lazy val unparser: Unparser = new BCDDecimalPrefixedLengthUnparser(
-    e.elementRuntimeData,
-    e.prefixedLengthBody.unparser,
-    e.prefixedLengthElementDecl.elementRuntimeData,
-    e.binaryDecimalVirtualPoint,
-    e.lengthUnits,
-    e.prefixedLengthAdjustmentInUnits
-  )
+  override lazy val unparser: Unparser =
+    new BCDDecimalMinimumLengthUnparser(e.elementRuntimeData, e.binaryDecimalVirtualPoint)
 }
diff --git a/.../src/main/scala/org/apache/daffodil/core/grammar/primitives/PrimitivesBinaryBoolean.scala b/.../src/main/scala/org/apache/daffodil/core/grammar/primitives/PrimitivesBinaryBoolean.scala
@@ -19,10 +19,10 @@ package org.apache.daffodil.core.grammar.primitives
 
 import org.apache.daffodil.core.dsom.ElementBase
 import org.apache.daffodil.core.grammar.Terminal
+import org.apache.daffodil.runtime1.processors.parsers.BinaryBooleanBitLimitLengthParser
 import org.apache.daffodil.runtime1.processors.parsers.BinaryBooleanParser
-import org.apache.daffodil.runtime1.processors.parsers.BinaryBooleanPrefixedLengthParser
 import org.apache.daffodil.runtime1.processors.unparsers.Unparser
-import org.apache.daffodil.unparsers.runtime1.BinaryBooleanPrefixedLengthUnparser
+import org.apache.daffodil.unparsers.runtime1.BinaryBooleanMinimumLengthUnparser
 import org.apache.daffodil.unparsers.runtime1.BinaryBooleanUnparser
 
 class BinaryBoolean(val e: ElementBase) extends Terminal(e, true) {
@@ -46,23 +46,17 @@ class BinaryBoolean(val e: ElementBase) extends Terminal(e, true) {
 }
 
 class BinaryBooleanPrefixedLength(val e: ElementBase) extends Terminal(e, true) {
-  override lazy val parser = new BinaryBooleanPrefixedLengthParser(
+  override lazy val parser = new BinaryBooleanBitLimitLengthParser(
     e.elementRuntimeData,
-    e.prefixedLengthBody.parser,
-    e.prefixedLengthElementDecl.elementRuntimeData,
     e.binaryBooleanTrueRep,
     e.binaryBooleanFalseRep,
-    e.lengthUnits,
-    e.prefixedLengthAdjustmentInUnits
+    e.lengthUnits
   )
 
-  override lazy val unparser: Unparser = new BinaryBooleanPrefixedLengthUnparser(
+  override lazy val unparser: Unparser = new BinaryBooleanMinimumLengthUnparser(
     e.elementRuntimeData,
-    e.prefixedLengthBody.unparser,
-    e.prefixedLengthElementDecl.elementRuntimeData,
     e.binaryBooleanTrueRep,
     e.binaryBooleanFalseRep,
-    e.lengthUnits,
-    e.prefixedLengthAdjustmentInUnits
+    e.lengthUnits
   )
 }
diff --git a/...e/src/main/scala/org/apache/daffodil/core/grammar/primitives/PrimitivesBinaryNumber.scala b/...e/src/main/scala/org/apache/daffodil/core/grammar/primitives/PrimitivesBinaryNumber.scala
@@ -22,22 +22,22 @@ import org.apache.daffodil.core.grammar.Terminal
 import org.apache.daffodil.lib.exceptions.Assert
 import org.apache.daffodil.lib.util.MaybeInt
 import org.apache.daffodil.runtime1.dpath.NodeInfo
+import org.apache.daffodil.runtime1.processors.parsers.BinaryDecimalBitLimitLengthParser
 import org.apache.daffodil.runtime1.processors.parsers.BinaryDecimalKnownLengthParser
-import org.apache.daffodil.runtime1.processors.parsers.BinaryDecimalPrefixedLengthParser
 import org.apache.daffodil.runtime1.processors.parsers.BinaryDecimalRuntimeLengthParser
 import org.apache.daffodil.runtime1.processors.parsers.BinaryDoubleParser
 import org.apache.daffodil.runtime1.processors.parsers.BinaryFloatParser
+import org.apache.daffodil.runtime1.processors.parsers.BinaryIntegerBitLimitLengthParser
 import org.apache.daffodil.runtime1.processors.parsers.BinaryIntegerKnownLengthParser
-import org.apache.daffodil.runtime1.processors.parsers.BinaryIntegerPrefixedLengthParser
 import org.apache.daffodil.runtime1.processors.parsers.BinaryIntegerRuntimeLengthParser
 import org.apache.daffodil.runtime1.processors.unparsers.Unparser
 import org.apache.daffodil.unparsers.runtime1.BinaryDecimalKnownLengthUnparser
-import org.apache.daffodil.unparsers.runtime1.BinaryDecimalPrefixedLengthUnparser
+import org.apache.daffodil.unparsers.runtime1.BinaryDecimalMinimumLengthUnparser
 import org.apache.daffodil.unparsers.runtime1.BinaryDecimalRuntimeLengthUnparser
 import org.apache.daffodil.unparsers.runtime1.BinaryDoubleUnparser
 import org.apache.daffodil.unparsers.runtime1.BinaryFloatUnparser
 import org.apache.daffodil.unparsers.runtime1.BinaryIntegerKnownLengthUnparser
-import org.apache.daffodil.unparsers.runtime1.BinaryIntegerPrefixedLengthUnparser
+import org.apache.daffodil.unparsers.runtime1.BinaryIntegerMinimumLengthUnparser
 import org.apache.daffodil.unparsers.runtime1.BinaryIntegerRuntimeLengthUnparser
 
 class BinaryIntegerRuntimeLength(val e: ElementBase, signed: Boolean)
@@ -77,14 +77,7 @@ class BinaryIntegerPrefixedLength(val e: ElementBase, signed: Boolean)
   private lazy val pladj = e.prefixedLengthAdjustmentInUnits
 
   override lazy val parser =
-    new BinaryIntegerPrefixedLengthParser(
-      erd,
-      e.prefixedLengthBody.parser,
-      plerd,
-      signed,
-      e.lengthUnits,
-      pladj
-    )
+    new BinaryIntegerBitLimitLengthParser(erd, signed)
 
   override lazy val unparser: Unparser = {
     val maybeNBits = e.primType match {
@@ -96,15 +89,7 @@ class BinaryIntegerPrefixedLength(val e: ElementBase, signed: Boolean)
       case _ =>
         Assert.invariantFailed("Only integer base types should be used for this primitive")
     }
-    new BinaryIntegerPrefixedLengthUnparser(
-      erd,
-      e.prefixedLengthBody.unparser,
-      plerd,
-      maybeNBits,
-      signed,
-      e.lengthUnits,
-      pladj
-    )
+    new BinaryIntegerMinimumLengthUnparser(erd, maybeNBits, signed)
   }
 }
 
@@ -149,25 +134,17 @@ class BinaryDecimalKnownLength(val e: ElementBase, lengthInBits: Long)
 class BinaryDecimalPrefixedLength(val e: ElementBase) extends Terminal(e, true) {
 
   override lazy val parser =
-    new BinaryDecimalPrefixedLengthParser(
+    new BinaryDecimalBitLimitLengthParser(
       e.elementRuntimeData,
-      e.prefixedLengthBody.parser,
-      e.prefixedLengthElementDecl.elementRuntimeData,
       e.decimalSigned,
-      e.binaryDecimalVirtualPoint,
-      e.lengthUnits,
-      e.prefixedLengthAdjustmentInUnits
+      e.binaryDecimalVirtualPoint
     )
 
   override lazy val unparser: Unparser =
-    new BinaryDecimalPrefixedLengthUnparser(
+    new BinaryDecimalMinimumLengthUnparser(
       e.elementRuntimeData,
-      e.prefixedLengthBody.unparser,
-      e.prefixedLengthElementDecl.elementRuntimeData,
       e.decimalSigned,
-      e.binaryDecimalVirtualPoint,
-      e.lengthUnits,
-      e.prefixedLengthAdjustmentInUnits
+      e.binaryDecimalVirtualPoint
     )
 
 }