Possible TypeError under Py2

[pyderasn.git] / pyderasn.py
diff --git a/pyderasn.py b/pyderasn.py

index 68d67d07e91a746886d22bb629d19a8ae6000f43..b9bc9dae515564a24dcc052005754d54993fca03 100755 (executable)
--- a/pyderasn.py
+++ b/pyderasn.py
@@ -1,6 +1,6 @@
  #!/usr/bin/env python
  # coding: utf-8
-# PyDERASN -- Python ASN.1 DER codec with abstract structures
+# PyDERASN -- Python ASN.1 DER/BER codec with abstract structures
  # Copyright (C) 2017-2018 Sergey Matveev <stargrave@stargrave.org>
  #
  # This program is free software: you can redistribute it and/or modify
@@ -16,10 +16,10 @@
  # You should have received a copy of the GNU Lesser General Public
  # License along with this program.  If not, see
  # <http://www.gnu.org/licenses/>.
-"""Python ASN.1 DER codec with abstract structures
+"""Python ASN.1 DER/BER codec with abstract structures
  
-This library allows you to marshal and unmarshal various structures in
-ASN.1 DER format, like this:
+This library allows you to marshal various structures in ASN.1 DER
+format, unmarshal them in BER/CER/DER ones.
  
      >>> i = Integer(123)
      >>> raw = i.encode()
@@ -189,11 +189,18 @@ use following properties:
  
  Pay attention that those values do **not** include anything related to
  explicit tag. If you want to know information about it, then use:
-``expled`` (to know if explicit tag is set), ``expl_offset`` (it is
-lesser than ``offset``), ``expl_tlen``, ``expl_llen``, ``expl_vlen``
-(that actually equals to ordinary ``tlvlen``).
  
-When error occurs, then :py:exc:`pyderasn.DecodeError` is raised.
+* ``expled`` -- to know if explicit tag is set
+* ``expl_offset`` (it is lesser than ``offset``)
+* ``expl_tlen``,
+* ``expl_llen``
+* ``expl_vlen`` (that actually equals to ordinary ``tlvlen``)
+* ``fulloffset`` -- it equals to ``expl_offset`` if explicit tag is set,
+  ``offset`` otherwise
+* ``fulllen`` -- it equals to ``expl_len`` if explicit tag is set,
+  ``tlvlen`` otherwise
+
+When error occurs, :py:exc:`pyderasn.DecodeError` is raised.
  
  .. _ctx:
  
@@ -206,6 +213,7 @@ decoding process.
  
  Currently available context options:
  
+* :ref:`bered <bered_ctx>`
  * :ref:`defines_by_path <defines_by_path_ctx>`
  * :ref:`strict_default_existence <strict_default_existence_ctx>`
  
@@ -363,6 +371,29 @@ First function is useful for path construction when some automatic
  decoding is already done. ``any`` means literally any value it meet --
  useful for SEQUENCE/SET OF-s.
  
+.. _bered_ctx:
+
+BER encoding
+------------
+
+By default PyDERASN accepts only DER encoded data. It always encodes to
+DER. But you can optionally enable BER decoding with setting ``bered``
+:ref:`context <ctx>` argument to True. Indefinite lengths and
+constructed primitive types should be parsed successfully.
+
+* If object is encoded in BER form (not the DER one), then ``bered``
+  attribute is set to True. Only ``BOOLEAN``, ``BIT STRING``, ``OCTET
+  STRING`` can contain it.
+* If object has an indefinite length encoding, then its ``lenindef``
+  attribute is set to True. Only ``BIT STRING``, ``OCTET STRING``,
+  ``SEQUENCE``, ``SET``, ``SEQUENCE OF``, ``SET OF``, ``ANY`` can
+  contain it.
+* If object has an indefinite length encoded explicit tag, then
+  ``expl_lenindef`` is set to True.
+
+EOC (end-of-contents) token's length is taken in advance in object's
+value length.
+
  Primitive types
  ---------------
  
@@ -404,6 +435,10 @@ CommonString
  ____________
  .. autoclass:: pyderasn.CommonString
  
+NumericString
+_____________
+.. autoclass:: pyderasn.NumericString
+
  UTCTime
  _______
  .. autoclass:: pyderasn.UTCTime
@@ -464,6 +499,17 @@ Various
  .. autofunction:: pyderasn.tag_ctxp
  .. autofunction:: pyderasn.tag_ctxc
  .. autoclass:: pyderasn.Obj
+.. autoclass:: pyderasn.DecodeError
+   :members: __init__
+.. autoclass:: pyderasn.NotEnoughData
+.. autoclass:: pyderasn.LenIndefForm
+.. autoclass:: pyderasn.TagMismatch
+.. autoclass:: pyderasn.InvalidLength
+.. autoclass:: pyderasn.InvalidOID
+.. autoclass:: pyderasn.ObjUnknown
+.. autoclass:: pyderasn.ObjNotReady
+.. autoclass:: pyderasn.InvalidValueType
+.. autoclass:: pyderasn.BoundsError
  """
  
  from codecs import getdecoder
@@ -516,6 +562,7 @@ __all__ = (
      "InvalidOID",
      "InvalidValueType",
      "ISO646String",
+    "LenIndefForm",
      "NotEnoughData",
      "Null",
      "NumericString",
@@ -561,6 +608,10 @@ TagClassReprs = {
      TagClassPrivate: "PRIVATE ",
      TagClassUniversal: "UNIV ",
  }
+EOC = b"\x00\x00"
+EOC_LEN = len(EOC)
+LENINDEF = b"\x80"  # length indefinite mark
+LENINDEF_PP_CHAR = "I" if PY2 else "∞"
  
  
  ########################################################################
@@ -606,6 +657,10 @@ class NotEnoughData(DecodeError):
      pass
  
  
+class LenIndefForm(DecodeError):
+    pass
+
+
  class TagMismatch(DecodeError):
      pass
  
@@ -797,6 +852,11 @@ def len_encode(l):
  
  
  def len_decode(data):
+    """Decode length
+
+    :returns: (decoded length, length's length, remaining data)
+    :raises LenIndefForm: if indefinite form encoding is met
+    """
      if len(data) == 0:
          raise NotEnoughData("no data at all")
      first_octet = byte2int(data)
@@ -806,7 +866,7 @@ def len_decode(data):
      if octets_num + 1 > len(data):
          raise NotEnoughData("encoded length is longer than data")
      if octets_num == 0:
-        raise DecodeError("long form instead of short one")
+        raise LenIndefForm()
      if byte2int(data[1:]) == 0:
          raise DecodeError("leading zeros")
      l = 0
@@ -843,6 +903,9 @@ class Obj(object):
          "offset",
          "llen",
          "vlen",
+        "expl_lenindef",
+        "lenindef",
+        "bered",
      )
  
      def __init__(
@@ -856,14 +919,15 @@ class Obj(object):
          self.tag = getattr(self, "impl", self.tag_default) if impl is None else impl
          self._expl = getattr(self, "expl", None) if expl is None else expl
          if self.tag != self.tag_default and self._expl is not None:
-            raise ValueError(
-                "implicit and explicit tags can not be set simultaneously"
-            )
+            raise ValueError("implicit and explicit tags can not be set simultaneously")
          if default is not None:
              optional = True
          self.optional = optional
          self.offset, self.llen, self.vlen = _decoded
          self.default = None
+        self.expl_lenindef = False
+        self.lenindef = False
+        self.bered = False
  
      @property
      def ready(self):  # pragma: no cover
@@ -974,6 +1038,36 @@ class Obj(object):
                  )
              try:
                  l, llen, v = len_decode(lv)
+            except LenIndefForm as err:
+                if not ctx.get("bered", False):
+                    raise err.__class__(
+                        msg=err.msg,
+                        klass=self.__class__,
+                        decode_path=decode_path,
+                        offset=offset,
+                    )
+                llen, v = 1, lv[1:]
+                offset += tlen + llen
+                result = self._decode(
+                    v,
+                    offset=offset,
+                    decode_path=decode_path,
+                    ctx=ctx,
+                    tag_only=tag_only,
+                )
+                if tag_only:
+                    return
+                obj, tail = result
+                eoc_expected, tail = tail[:EOC_LEN], tail[EOC_LEN:]
+                if eoc_expected.tobytes() != EOC:
+                    raise DecodeError(
+                        "no EOC",
+                        klass=self.__class__,
+                        decode_path=decode_path,
+                        offset=offset,
+                    )
+                obj.vlen += EOC_LEN
+                obj.expl_lenindef = True
              except DecodeError as err:
                  raise err.__class__(
                      msg=err.msg,
@@ -981,23 +1075,24 @@ class Obj(object):
                      decode_path=decode_path,
                      offset=offset,
                  )
-            if l > len(v):
-                raise NotEnoughData(
-                    "encoded length is longer than data",
-                    klass=self.__class__,
+            else:
+                if l > len(v):
+                    raise NotEnoughData(
+                        "encoded length is longer than data",
+                        klass=self.__class__,
+                        decode_path=decode_path,
+                        offset=offset,
+                    )
+                result = self._decode(
+                    v,
+                    offset=offset + tlen + llen,
                      decode_path=decode_path,
-                    offset=offset,
+                    ctx=ctx,
+                    tag_only=tag_only,
                  )
-            result = self._decode(
-                v,
-                offset=offset + tlen + llen,
-                decode_path=decode_path,
-                ctx=ctx,
-                tag_only=tag_only,
-            )
-            if tag_only:
-                return
-            obj, tail = result
+                if tag_only:
+                    return
+                obj, tail = result
          return obj, (tail if leavemm else tail.tobytes())
  
      @property
@@ -1014,6 +1109,8 @@ class Obj(object):
  
      @property
      def expl_llen(self):
+        if self.expl_lenindef:
+            return 1
          return len(len_encode(self.tlvlen))
  
      @property
@@ -1028,6 +1125,41 @@ class Obj(object):
      def expl_tlvlen(self):
          return self.expl_tlen + self.expl_llen + self.expl_vlen
  
+    @property
+    def fulloffset(self):
+        return self.expl_offset if self.expled else self.offset
+
+    @property
+    def fulllen(self):
+        return self.expl_tlvlen if self.expled else self.tlvlen
+
+    def pps_lenindef(self, decode_path):
+        if self.lenindef:
+            yield _pp(
+                asn1_type_name="EOC",
+                obj_name="",
+                decode_path=decode_path,
+                offset=(
+                    self.offset + self.tlvlen -
+                    (EOC_LEN * 2 if self.expl_lenindef else EOC_LEN)
+                ),
+                tlen=1,
+                llen=1,
+                vlen=0,
+                bered=True,
+            )
+        if self.expl_lenindef:
+            yield _pp(
+                asn1_type_name="EOC",
+                obj_name="EXPLICIT",
+                decode_path=decode_path,
+                offset=self.expl_offset + self.expl_tlvlen - EOC_LEN,
+                tlen=1,
+                llen=1,
+                vlen=0,
+                bered=True,
+            )
+
  
  class DecodePathDefBy(object):
      """DEFINED BY representation inside decode path
@@ -1074,6 +1206,9 @@ PP = namedtuple("PP", (
      "expl_tlen",
      "expl_llen",
      "expl_vlen",
+    "expl_lenindef",
+    "lenindef",
+    "bered",
  ))
  
  
@@ -1095,6 +1230,9 @@ def _pp(
          expl_tlen=None,
          expl_llen=None,
          expl_vlen=None,
+        expl_lenindef=False,
+        lenindef=False,
+        bered=False,
  ):
      return PP(
          asn1_type_name,
@@ -1114,6 +1252,9 @@ def _pp(
          expl_tlen,
          expl_llen,
          expl_vlen,
+        expl_lenindef,
+        lenindef,
+        bered,
      )
  
  
@@ -1130,16 +1271,23 @@ def pp_console_row(
  ):
      cols = []
      if with_offsets:
-        col = "%5d%s" % (
+        col = "%5d%s%s" % (
              pp.offset,
              (
                  "  " if pp.expl_offset is None else
                  ("-%d" % (pp.offset - pp.expl_offset))
              ),
+            LENINDEF_PP_CHAR if pp.expl_lenindef else " ",
          )
          cols.append(_colorize(col, "red", with_colours, ()))
-        col = "[%d,%d,%4d]" % (pp.tlen, pp.llen, pp.vlen)
-        cols.append(_colorize(col, "green", with_colours, ()))
+        col = "[%d,%d,%4d]%s" % (
+            pp.tlen,
+            pp.llen,
+            pp.vlen,
+            LENINDEF_PP_CHAR if pp.lenindef else " "
+        )
+        col = _colorize(col, "green", with_colours, ())
+        cols.append(col)
      if len(pp.decode_path) > 0:
          cols.append(" ." * (len(pp.decode_path)))
          ent = pp.decode_path[-1]
@@ -1167,6 +1315,8 @@ def pp_console_row(
          cols.append(_colorize(col, "blue", with_colours))
      if pp.asn1_type_name.replace(" ", "") != pp.obj_name.upper():
          cols.append(_colorize(pp.obj_name, "magenta", with_colours))
+    if pp.bered:
+        cols.append(_colorize("BER", "red", with_colours))
      cols.append(_colorize(pp.asn1_type_name, "cyan", with_colours))
      if pp.value is not None:
          value = pp.value
@@ -1190,7 +1340,7 @@ def pp_console_row(
  
  
  def pp_console_blob(pp):
-    cols = [" " * len("XXXXXYY [X,X,XXXX]")]
+    cols = [" " * len("XXXXXYYZ [X,X,XXXX]Z")]
      if len(pp.decode_path) > 0:
          cols.append(" ." * (len(pp.decode_path) + 1))
      if isinstance(pp.blob, binary_type):
@@ -1398,10 +1548,14 @@ class Boolean(Obj):
                  offset=offset,
              )
          first_octet = byte2int(v)
+        bered = False
          if first_octet == 0:
              value = False
          elif first_octet == 0xFF:
              value = True
+        elif ctx.get("bered", False):
+            value = True
+            bered = True
          else:
              raise DecodeError(
                  "unacceptable Boolean value",
@@ -1417,6 +1571,7 @@ class Boolean(Obj):
              optional=self.optional,
              _decoded=(offset, 1, 1),
          )
+        obj.bered = bered
          return obj, v[1:]
  
      def __repr__(self):
@@ -1440,7 +1595,11 @@ class Boolean(Obj):
              expl_tlen=self.expl_tlen if self.expled else None,
              expl_llen=self.expl_llen if self.expled else None,
              expl_vlen=self.expl_vlen if self.expled else None,
+            expl_lenindef=self.expl_lenindef,
+            bered=self.bered,
          )
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  class Integer(Obj):
@@ -1762,7 +1921,10 @@ class Integer(Obj):
              expl_tlen=self.expl_tlen if self.expled else None,
              expl_llen=self.expl_llen if self.expled else None,
              expl_vlen=self.expl_vlen if self.expled else None,
+            expl_lenindef=self.expl_lenindef,
          )
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  class BitString(Obj):
@@ -1777,6 +1939,8 @@ class BitString(Obj):
      >>> b.bit_len
      88
  
+    >>> BitString("'0A3B5F291CD'H")
+    BIT STRING 44 bits 0a3b5f291cd0
      >>> b = BitString("'010110000000'B")
      BIT STRING 12 bits 5800
      >>> b.bit_len
@@ -1803,8 +1967,16 @@ class BitString(Obj):
      ['nonRepudiation', 'keyEncipherment']
      >>> b.specs
      {'nonRepudiation': 1, 'digitalSignature': 0, 'keyEncipherment': 2}
+
+    .. note::
+
+       Pay attention that BIT STRING can be encoded both in primitive
+       and constructed forms. Decoder always checks constructed form tag
+       additionally to specified primitive one. If BER decoding is
+       :ref:`not enabled <bered_ctx>`, then decoder will fail, because
+       of DER restrictions.
      """
-    __slots__ = ("specs", "defined")
+    __slots__ = ("tag_constructed", "specs", "defined")
      tag_default = tag_encode(3)
      asn1_type_name = "BIT STRING"
  
@@ -1842,6 +2014,12 @@ class BitString(Obj):
              if value is None:
                  self._value = default
          self.defined = None
+        tag_klass, _, tag_num = tag_decode(self.tag)
+        self.tag_constructed = tag_encode(
+            klass=tag_klass,
+            form=TagFormConstructed,
+            num=tag_num,
+        )
  
      def _bits2octets(self, bits):
          if len(self.specs) > 0:
@@ -1859,21 +2037,23 @@ class BitString(Obj):
          if isinstance(value, (string_types, binary_type)):
              if (
                      isinstance(value, string_types) and
-                    value.startswith("'") and
-                    value.endswith("'B")
+                    value.startswith("'")
              ):
-                value = value[1:-2]
-                if not set(value) <= set(("0", "1")):
-                    raise ValueError("B's coding contains unacceptable chars")
-                return self._bits2octets(value)
-            elif isinstance(value, binary_type):
+                if value.endswith("'B"):
+                    value = value[1:-2]
+                    if not set(value) <= set(("0", "1")):
+                        raise ValueError("B's coding contains unacceptable chars")
+                    return self._bits2octets(value)
+                elif value.endswith("'H"):
+                    value = value[1:-2]
+                    return (
+                        len(value) * 4,
+                        hexdec(value + ("" if len(value) % 2 == 0 else "0")),
+                    )
+            if isinstance(value, binary_type):
                  return (len(value) * 8, value)
              else:
-                raise InvalidValueType((
-                    self.__class__,
-                    string_types,
-                    binary_type,
-                ))
+                raise InvalidValueType((self.__class__, string_types, binary_type))
          if isinstance(value, tuple):
              if (
                      len(value) == 2 and
@@ -1987,24 +2167,7 @@ class BitString(Obj):
              octets,
          ))
  
-    def _decode(self, tlv, offset, decode_path, ctx, tag_only):
-        try:
-            t, _, lv = tag_strip(tlv)
-        except DecodeError as err:
-            raise err.__class__(
-                msg=err.msg,
-                klass=self.__class__,
-                decode_path=decode_path,
-                offset=offset,
-            )
-        if t != self.tag:
-            raise TagMismatch(
-                klass=self.__class__,
-                decode_path=decode_path,
-                offset=offset,
-            )
-        if tag_only:
-            return
+    def _decode_chunk(self, lv, offset, decode_path, ctx):
          try:
              l, llen, v = len_decode(lv)
          except DecodeError as err:
@@ -2062,6 +2225,134 @@ class BitString(Obj):
          )
          return obj, tail
  
+    def _decode(self, tlv, offset, decode_path, ctx, tag_only):
+        try:
+            t, tlen, lv = tag_strip(tlv)
+        except DecodeError as err:
+            raise err.__class__(
+                msg=err.msg,
+                klass=self.__class__,
+                decode_path=decode_path,
+                offset=offset,
+            )
+        if t == self.tag:
+            if tag_only:
+                return
+            return self._decode_chunk(lv, offset, decode_path, ctx)
+        if t == self.tag_constructed:
+            if not ctx.get("bered", False):
+                raise DecodeError(
+                    "unallowed BER constructed encoding",
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            if tag_only:
+                return
+            lenindef = False
+            try:
+                l, llen, v = len_decode(lv)
+            except LenIndefForm:
+                llen, l, v = 1, 0, lv[1:]
+                lenindef = True
+            except DecodeError as err:
+                raise err.__class__(
+                    msg=err.msg,
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            if l > len(v):
+                raise NotEnoughData(
+                    "encoded length is longer than data",
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            if not lenindef and l == 0:
+                raise NotEnoughData(
+                    "zero length",
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            chunks = []
+            sub_offset = offset + tlen + llen
+            vlen = 0
+            while True:
+                if lenindef:
+                    if v[:EOC_LEN].tobytes() == EOC:
+                        break
+                else:
+                    if vlen == l:
+                        break
+                    if vlen > l:
+                        raise DecodeError(
+                            "chunk out of bounds",
+                            klass=self.__class__,
+                            decode_path=decode_path + (str(len(chunks) - 1),),
+                            offset=chunks[-1].offset,
+                        )
+                sub_decode_path = decode_path + (str(len(chunks)),)
+                try:
+                    chunk, v_tail = BitString().decode(
+                        v,
+                        offset=sub_offset,
+                        decode_path=sub_decode_path,
+                        leavemm=True,
+                        ctx=ctx,
+                    )
+                except TagMismatch:
+                    raise DecodeError(
+                        "expected BitString encoded chunk",
+                        klass=self.__class__,
+                        decode_path=sub_decode_path,
+                        offset=sub_offset,
+                    )
+                chunks.append(chunk)
+                sub_offset += chunk.tlvlen
+                vlen += chunk.tlvlen
+                v = v_tail
+            if len(chunks) == 0:
+                raise DecodeError(
+                    "no chunks",
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            values = []
+            bit_len = 0
+            for chunk_i, chunk in enumerate(chunks[:-1]):
+                if chunk.bit_len % 8 != 0:
+                    raise DecodeError(
+                        "BitString chunk is not multiple of 8 bits",
+                        klass=self.__class__,
+                        decode_path=decode_path + (str(chunk_i),),
+                        offset=chunk.offset,
+                    )
+                values.append(bytes(chunk))
+                bit_len += chunk.bit_len
+            chunk_last = chunks[-1]
+            values.append(bytes(chunk_last))
+            bit_len += chunk_last.bit_len
+            obj = self.__class__(
+                value=(bit_len, b"".join(values)),
+                impl=self.tag,
+                expl=self._expl,
+                default=self.default,
+                optional=self.optional,
+                _specs=self.specs,
+                _decoded=(offset, llen, vlen + (EOC_LEN if lenindef else 0)),
+            )
+            obj.lenindef = lenindef
+            obj.bered = True
+            return obj, (v[EOC_LEN:] if lenindef else v)
+        raise TagMismatch(
+            klass=self.__class__,
+            decode_path=decode_path,
+            offset=offset,
+        )
+
      def __repr__(self):
          return pp_console_row(next(self.pps()))
  
@@ -2091,12 +2382,17 @@ class BitString(Obj):
              expl_tlen=self.expl_tlen if self.expled else None,
              expl_llen=self.expl_llen if self.expled else None,
              expl_vlen=self.expl_vlen if self.expled else None,
+            expl_lenindef=self.expl_lenindef,
+            lenindef=self.lenindef,
+            bered=self.bered,
          )
          defined_by, defined = self.defined or (None, None)
          if defined_by is not None:
              yield defined.pps(
                  decode_path=decode_path + (DecodePathDefBy(defined_by),)
              )
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  class OctetString(Obj):
@@ -2114,8 +2410,16 @@ class OctetString(Obj):
      pyderasn.BoundsError: unsatisfied bounds: 4 <= 5 <= 4
      >>> OctetString(b"hell", bounds=(4, 4))
      OCTET STRING 4 bytes 68656c6c
+
+    .. note::
+
+       Pay attention that OCTET STRING can be encoded both in primitive
+       and constructed forms. Decoder always checks constructed form tag
+       additionally to specified primitive one. If BER decoding is
+       :ref:`not enabled <bered_ctx>`, then decoder will fail, because
+       of DER restrictions.
      """
-    __slots__ = ("_bound_min", "_bound_max", "defined")
+    __slots__ = ("tag_constructed", "_bound_min", "_bound_max", "defined")
      tag_default = tag_encode(4)
      asn1_type_name = "OCTET STRING"
  
@@ -2164,6 +2468,12 @@ class OctetString(Obj):
              if self._value is None:
                  self._value = default
          self.defined = None
+        tag_klass, _, tag_num = tag_decode(self.tag)
+        self.tag_constructed = tag_encode(
+            klass=tag_klass,
+            form=TagFormConstructed,
+            num=tag_num,
+        )
  
      def _value_sanitize(self, value):
          if issubclass(value.__class__, OctetString):
@@ -2241,24 +2551,7 @@ class OctetString(Obj):
              self._value,
          ))
  
-    def _decode(self, tlv, offset, decode_path, ctx, tag_only):
-        try:
-            t, _, lv = tag_strip(tlv)
-        except DecodeError as err:
-            raise err.__class__(
-                msg=err.msg,
-                klass=self.__class__,
-                decode_path=decode_path,
-                offset=offset,
-            )
-        if t != self.tag:
-            raise TagMismatch(
-                klass=self.__class__,
-                decode_path=decode_path,
-                offset=offset,
-            )
-        if tag_only:
-            return
+    def _decode_chunk(self, lv, offset, decode_path, ctx):
          try:
              l, llen, v = len_decode(lv)
          except DecodeError as err:
@@ -2302,6 +2595,120 @@ class OctetString(Obj):
              )
          return obj, tail
  
+    def _decode(self, tlv, offset, decode_path, ctx, tag_only):
+        try:
+            t, tlen, lv = tag_strip(tlv)
+        except DecodeError as err:
+            raise err.__class__(
+                msg=err.msg,
+                klass=self.__class__,
+                decode_path=decode_path,
+                offset=offset,
+            )
+        if t == self.tag:
+            if tag_only:
+                return
+            return self._decode_chunk(lv, offset, decode_path, ctx)
+        if t == self.tag_constructed:
+            if not ctx.get("bered", False):
+                raise DecodeError(
+                    "unallowed BER constructed encoding",
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            if tag_only:
+                return
+            lenindef = False
+            try:
+                l, llen, v = len_decode(lv)
+            except LenIndefForm:
+                llen, l, v = 1, 0, lv[1:]
+                lenindef = True
+            except DecodeError as err:
+                raise err.__class__(
+                    msg=err.msg,
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            if l > len(v):
+                raise NotEnoughData(
+                    "encoded length is longer than data",
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            chunks = []
+            sub_offset = offset + tlen + llen
+            vlen = 0
+            while True:
+                if lenindef:
+                    if v[:EOC_LEN].tobytes() == EOC:
+                        break
+                else:
+                    if vlen == l:
+                        break
+                    if vlen > l:
+                        raise DecodeError(
+                            "chunk out of bounds",
+                            klass=self.__class__,
+                            decode_path=decode_path + (str(len(chunks) - 1),),
+                            offset=chunks[-1].offset,
+                        )
+                sub_decode_path = decode_path + (str(len(chunks)),)
+                try:
+                    chunk, v_tail = OctetString().decode(
+                        v,
+                        offset=sub_offset,
+                        decode_path=sub_decode_path,
+                        leavemm=True,
+                        ctx=ctx,
+                    )
+                except TagMismatch:
+                    raise DecodeError(
+                        "expected OctetString encoded chunk",
+                        klass=self.__class__,
+                        decode_path=sub_decode_path,
+                        offset=sub_offset,
+                    )
+                chunks.append(chunk)
+                sub_offset += chunk.tlvlen
+                vlen += chunk.tlvlen
+                v = v_tail
+            try:
+                obj = self.__class__(
+                    value=b"".join(bytes(chunk) for chunk in chunks),
+                    bounds=(self._bound_min, self._bound_max),
+                    impl=self.tag,
+                    expl=self._expl,
+                    default=self.default,
+                    optional=self.optional,
+                    _decoded=(offset, llen, vlen + (EOC_LEN if lenindef else 0)),
+                )
+            except DecodeError as err:
+                raise DecodeError(
+                    msg=err.msg,
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            except BoundsError as err:
+                raise DecodeError(
+                    msg=str(err),
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            obj.lenindef = lenindef
+            obj.bered = True
+            return obj, (v[EOC_LEN:] if lenindef else v)
+        raise TagMismatch(
+            klass=self.__class__,
+            decode_path=decode_path,
+            offset=offset,
+        )
+
      def __repr__(self):
          return pp_console_row(next(self.pps()))
  
@@ -2324,12 +2731,17 @@ class OctetString(Obj):
              expl_tlen=self.expl_tlen if self.expled else None,
              expl_llen=self.expl_llen if self.expled else None,
              expl_vlen=self.expl_vlen if self.expled else None,
+            expl_lenindef=self.expl_lenindef,
+            lenindef=self.lenindef,
+            bered=self.bered,
          )
          defined_by, defined = self.defined or (None, None)
          if defined_by is not None:
              yield defined.pps(
                  decode_path=decode_path + (DecodePathDefBy(defined_by),)
              )
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  class Null(Obj):
@@ -2460,7 +2872,10 @@ class Null(Obj):
              expl_tlen=self.expl_tlen if self.expled else None,
              expl_llen=self.expl_llen if self.expled else None,
              expl_vlen=self.expl_vlen if self.expled else None,
+            expl_lenindef=self.expl_lenindef,
          )
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  class ObjectIdentifier(Obj):
@@ -2748,7 +3163,10 @@ class ObjectIdentifier(Obj):
              expl_tlen=self.expl_tlen if self.expled else None,
              expl_llen=self.expl_llen if self.expled else None,
              expl_vlen=self.expl_vlen if self.expled else None,
+            expl_lenindef=self.expl_lenindef,
          )
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  class Enumerated(Integer):
@@ -2966,7 +3384,14 @@ class CommonString(OctetString):
              tlen=self.tlen,
              llen=self.llen,
              vlen=self.vlen,
+            expl_offset=self.expl_offset if self.expled else None,
+            expl_tlen=self.expl_tlen if self.expled else None,
+            expl_llen=self.expl_llen if self.expled else None,
+            expl_vlen=self.expl_vlen if self.expled else None,
+            expl_lenindef=self.expl_lenindef,
          )
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  class UTF8String(CommonString):
@@ -2977,6 +3402,10 @@ class UTF8String(CommonString):
  
  
  class NumericString(CommonString):
+    """Numeric string
+
+    Its value is properly sanitized: only ASCII digits can be stored.
+    """
      __slots__ = ()
      tag_default = tag_encode(18)
      encoding = "ascii"
@@ -3093,11 +3522,14 @@ class UTCTime(CommonString):
          if isinstance(value, datetime):
              return value.strftime(self.fmt).encode("ascii")
          if isinstance(value, binary_type):
-            value_decoded = value.decode("ascii")
+            try:
+                value_decoded = value.decode("ascii")
+            except (UnicodeEncodeError, UnicodeDecodeError) as err:
+                raise DecodeError("invalid UTCTime encoding")
              if len(value_decoded) == LEN_YYMMDDHHMMSSZ:
                  try:
                      datetime.strptime(value_decoded, self.fmt)
-                except ValueError:
+                except (TypeError, ValueError):
                      raise DecodeError("invalid UTCTime format")
                  return value
              else:
@@ -3154,7 +3586,14 @@ class UTCTime(CommonString):
              tlen=self.tlen,
              llen=self.llen,
              vlen=self.vlen,
+            expl_offset=self.expl_offset if self.expled else None,
+            expl_tlen=self.expl_tlen if self.expled else None,
+            expl_llen=self.expl_llen if self.expled else None,
+            expl_vlen=self.expl_vlen if self.expled else None,
+            expl_lenindef=self.expl_lenindef,
          )
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  class GeneralizedTime(UTCTime):
@@ -3184,11 +3623,14 @@ class GeneralizedTime(UTCTime):
                  self.fmt_ms if value.microsecond > 0 else self.fmt
              ).encode("ascii")
          if isinstance(value, binary_type):
-            value_decoded = value.decode("ascii")
+            try:
+                value_decoded = value.decode("ascii")
+            except (UnicodeEncodeError, UnicodeDecodeError) as err:
+                raise DecodeError("invalid GeneralizedTime encoding")
              if len(value_decoded) == LEN_YYYYMMDDHHMMSSZ:
                  try:
                      datetime.strptime(value_decoded, self.fmt)
-                except ValueError:
+                except (TypeError, ValueError):
                      raise DecodeError(
                          "invalid GeneralizedTime (without ms) format",
                      )
@@ -3196,7 +3638,7 @@ class GeneralizedTime(UTCTime):
              elif len(value_decoded) >= LEN_YYYYMMDDHHMMSSDMZ:
                  try:
                      datetime.strptime(value_decoded, self.fmt_ms)
-                except ValueError:
+                except (TypeError, ValueError):
                      raise DecodeError(
                          "invalid GeneralizedTime (with ms) format",
                      )
@@ -3460,7 +3902,7 @@ class Choice(Obj):
              expl=self._expl,
              default=self.default,
              optional=self.optional,
-            _decoded=(offset, 0, value.tlvlen),
+            _decoded=(offset, 0, value.fulllen),
          )
          obj._value = (choice, value)
          return obj, tail
@@ -3485,9 +3927,12 @@ class Choice(Obj):
              tlen=self.tlen,
              llen=self.llen,
              vlen=self.vlen,
+            expl_lenindef=self.expl_lenindef,
          )
          if self.ready:
              yield self.value.pps(decode_path=decode_path + (self.choice,))
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  class PrimitiveTypes(Choice):
@@ -3616,7 +4061,47 @@ class Any(Obj):
      def _decode(self, tlv, offset, decode_path, ctx, tag_only):
          try:
              t, tlen, lv = tag_strip(tlv)
+        except DecodeError as err:
+            raise err.__class__(
+                msg=err.msg,
+                klass=self.__class__,
+                decode_path=decode_path,
+                offset=offset,
+            )
+        try:
              l, llen, v = len_decode(lv)
+        except LenIndefForm as err:
+            if not ctx.get("bered", False):
+                raise err.__class__(
+                    msg=err.msg,
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            llen, vlen, v = 1, 0, lv[1:]
+            sub_offset = offset + tlen + llen
+            chunk_i = 0
+            while v[:EOC_LEN].tobytes() != EOC:
+                chunk, v = Any().decode(
+                    v,
+                    offset=sub_offset,
+                    decode_path=decode_path + (str(chunk_i),),
+                    leavemm=True,
+                    ctx=ctx,
+                )
+                vlen += chunk.tlvlen
+                sub_offset += chunk.tlvlen
+                chunk_i += 1
+            tlvlen = tlen + llen + vlen + EOC_LEN
+            obj = self.__class__(
+                value=tlv[:tlvlen].tobytes(),
+                expl=self._expl,
+                optional=self.optional,
+                _decoded=(offset, 0, tlvlen),
+            )
+            obj.lenindef = True
+            obj.tag = t
+            return obj, v[EOC_LEN:]
          except DecodeError as err:
              raise err.__class__(
                  msg=err.msg,
@@ -3663,12 +4148,16 @@ class Any(Obj):
              expl_tlen=self.expl_tlen if self.expled else None,
              expl_llen=self.expl_llen if self.expled else None,
              expl_vlen=self.expl_vlen if self.expled else None,
+            expl_lenindef=self.expl_lenindef,
+            lenindef=self.lenindef,
          )
          defined_by, defined = self.defined or (None, None)
          if defined_by is not None:
              yield defined.pps(
                  decode_path=decode_path + (DecodePathDefBy(defined_by),)
              )
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  ########################################################################
@@ -3772,7 +4261,7 @@ class Sequence(Obj):
          ("algorithm", ObjectIdentifier("1.2.3")),
          ("parameters", Any(Null()))
      ))
-    AlgorithmIdentifier SEQUENCE[OBJECT IDENTIFIER 1.2.3, ANY 0500 OPTIONAL]
+    AlgorithmIdentifier SEQUENCE[algorithm: OBJECT IDENTIFIER 1.2.3; parameters: ANY 0500 OPTIONAL]
  
      You can determine if value exists/set in the sequence and take its value:
  
@@ -3963,8 +4452,19 @@ class Sequence(Obj):
              )
          if tag_only:
              return
+        lenindef = False
          try:
              l, llen, v = len_decode(lv)
+        except LenIndefForm as err:
+            if not ctx.get("bered", False):
+                raise err.__class__(
+                    msg=err.msg,
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            l, llen, v = 0, 1, lv[1:]
+            lenindef = True
          except DecodeError as err:
              raise err.__class__(
                  msg=err.msg,
@@ -3979,11 +4479,16 @@ class Sequence(Obj):
                  decode_path=decode_path,
                  offset=offset,
              )
-        v, tail = v[:l], v[l:]
+        if not lenindef:
+            v, tail = v[:l], v[l:]
+        vlen = 0
          sub_offset = offset + tlen + llen
          values = {}
          for name, spec in self.specs.items():
-            if len(v) == 0 and spec.optional:
+            if spec.optional and (
+                    (lenindef and v[:EOC_LEN].tobytes() == EOC) or
+                    len(v) == 0
+            ):
                  continue
              sub_decode_path = decode_path + (name,)
              try:
@@ -3999,7 +4504,7 @@ class Sequence(Obj):
                      continue
                  raise
  
-            defined = get_def_by_path(ctx.get("defines", ()), sub_decode_path)
+            defined = get_def_by_path(ctx.get("_defines", ()), sub_decode_path)
              if defined is not None:
                  defined_by, defined_spec = defined
                  if issubclass(value.__class__, SequenceOf):
@@ -4046,7 +4551,9 @@ class Sequence(Obj):
                          )
                      value.defined = (defined_by, defined_value)
  
-            sub_offset += (value.expl_tlvlen if value.expled else value.tlvlen)
+            value_len = value.fulllen
+            vlen += value_len
+            sub_offset += value_len
              v = v_tail
              if spec.default is not None and value == spec.default:
                  if ctx.get("strict_default_existence", False):
@@ -4069,11 +4576,21 @@ class Sequence(Obj):
                  for rel_path, schema in spec_defines:
                      defined = schema.get(value, None)
                      if defined is not None:
-                        ctx.setdefault("defines", []).append((
+                        ctx.setdefault("_defines", []).append((
                              abs_decode_path(sub_decode_path[:-1], rel_path),
                              (value, defined),
                          ))
-        if len(v) > 0:
+        if lenindef:
+            if v[:EOC_LEN].tobytes() != EOC:
+                raise DecodeError(
+                    "no EOC",
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            tail = v[EOC_LEN:]
+            vlen += EOC_LEN
+        elif len(v) > 0:
              raise DecodeError(
                  "remaining data",
                  klass=self.__class__,
@@ -4086,9 +4603,10 @@ class Sequence(Obj):
              expl=self._expl,
              default=self.default,
              optional=self.optional,
-            _decoded=(offset, llen, l),
+            _decoded=(offset, llen, vlen),
          )
          obj._value = values
+        obj.lenindef = lenindef
          return obj, tail
  
      def __repr__(self):
@@ -4098,8 +4616,8 @@ class Sequence(Obj):
              _value = self._value.get(name)
              if _value is None:
                  continue
-            cols.append(repr(_value))
-        return "%s[%s]" % (value, ", ".join(cols))
+            cols.append("%s: %s" % (name, repr(_value)))
+        return "%s[%s]" % (value, "; ".join(cols))
  
      def pps(self, decode_path=()):
          yield _pp(
@@ -4118,12 +4636,16 @@ class Sequence(Obj):
              expl_tlen=self.expl_tlen if self.expled else None,
              expl_llen=self.expl_llen if self.expled else None,
              expl_vlen=self.expl_vlen if self.expled else None,
+            expl_lenindef=self.expl_lenindef,
+            lenindef=self.lenindef,
          )
          for name in self.specs:
              value = self._value.get(name)
              if value is None:
                  continue
              yield value.pps(decode_path=decode_path + (name,))
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  class Set(Sequence):
@@ -4159,8 +4681,19 @@ class Set(Sequence):
              )
          if tag_only:
              return
+        lenindef = False
          try:
              l, llen, v = len_decode(lv)
+        except LenIndefForm as err:
+            if not ctx.get("bered", False):
+                raise err.__class__(
+                    msg=err.msg,
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            l, llen, v = 0, 1, lv[1:]
+            lenindef = True
          except DecodeError as err:
              raise err.__class__(
                  msg=err.msg,
@@ -4174,11 +4707,15 @@ class Set(Sequence):
                  klass=self.__class__,
                  offset=offset,
              )
-        v, tail = v[:l], v[l:]
+        if not lenindef:
+            v, tail = v[:l], v[l:]
+        vlen = 0
          sub_offset = offset + tlen + llen
          values = {}
          specs_items = self.specs.items
          while len(v) > 0:
+            if lenindef and v[:EOC_LEN].tobytes() == EOC:
+                break
              for name, spec in specs_items():
                  sub_decode_path = decode_path + (name,)
                  try:
@@ -4206,9 +4743,9 @@ class Set(Sequence):
                  decode_path=sub_decode_path,
                  ctx=ctx,
              )
-            sub_offset += (
-                value.expl_tlvlen if value.expled else value.tlvlen
-            )
+            value_len = value.fulllen
+            sub_offset += value_len
+            vlen += value_len
              v = v_tail
              if spec.default is None or value != spec.default:  # pragma: no cover
                  # SeqMixing.test_encoded_default_accepted covers that place
@@ -4219,9 +4756,26 @@ class Set(Sequence):
              expl=self._expl,
              default=self.default,
              optional=self.optional,
-            _decoded=(offset, llen, l),
+            _decoded=(offset, llen, vlen + (EOC_LEN if lenindef else 0)),
          )
          obj._value = values
+        if lenindef:
+            if v[:EOC_LEN].tobytes() != EOC:
+                raise DecodeError(
+                    "no EOC",
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            tail = v[EOC_LEN:]
+            obj.lenindef = True
+        if not obj.ready:
+            raise DecodeError(
+                "not all values are ready",
+                klass=self.__class__,
+                decode_path=decode_path,
+                offset=offset,
+            )
          return obj, tail
  
  
@@ -4423,8 +4977,19 @@ class SequenceOf(Obj):
              )
          if tag_only:
              return
+        lenindef = False
          try:
              l, llen, v = len_decode(lv)
+        except LenIndefForm as err:
+            if not ctx.get("bered", False):
+                raise err.__class__(
+                    msg=err.msg,
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            l, llen, v = 0, 1, lv[1:]
+            lenindef = True
          except DecodeError as err:
              raise err.__class__(
                  msg=err.msg,
@@ -4439,11 +5004,15 @@ class SequenceOf(Obj):
                  decode_path=decode_path,
                  offset=offset,
              )
-        v, tail = v[:l], v[l:]
+        if not lenindef:
+            v, tail = v[:l], v[l:]
+        vlen = 0
          sub_offset = offset + tlen + llen
          _value = []
          spec = self.spec
          while len(v) > 0:
+            if lenindef and v[:EOC_LEN].tobytes() == EOC:
+                break
              value, v_tail = spec.decode(
                  v,
                  sub_offset,
@@ -4451,7 +5020,9 @@ class SequenceOf(Obj):
                  decode_path=decode_path + (str(len(_value)),),
                  ctx=ctx,
              )
-            sub_offset += (value.expl_tlvlen if value.expled else value.tlvlen)
+            value_len = value.fulllen
+            sub_offset += value_len
+            vlen += value_len
              v = v_tail
              _value.append(value)
          obj = self.__class__(
@@ -4462,8 +5033,18 @@ class SequenceOf(Obj):
              expl=self._expl,
              default=self.default,
              optional=self.optional,
-            _decoded=(offset, llen, l),
+            _decoded=(offset, llen, vlen + (EOC_LEN if lenindef else 0)),
          )
+        if lenindef:
+            if v[:EOC_LEN].tobytes() != EOC:
+                raise DecodeError(
+                    "no EOC",
+                    klass=self.__class__,
+                    decode_path=decode_path,
+                    offset=offset,
+                )
+            obj.lenindef = True
+            tail = v[EOC_LEN:]
          return obj, tail
  
      def __repr__(self):
@@ -4489,9 +5070,13 @@ class SequenceOf(Obj):
              expl_tlen=self.expl_tlen if self.expled else None,
              expl_llen=self.expl_llen if self.expled else None,
              expl_vlen=self.expl_vlen if self.expled else None,
+            expl_lenindef=self.expl_lenindef,
+            lenindef=self.lenindef,
          )
          for i, value in enumerate(self._value):
              yield value.pps(decode_path=decode_path + (str(i),))
+        for pp in self.pps_lenindef(decode_path):
+            yield pp
  
  
  class SetOf(SequenceOf):
@@ -4572,7 +5157,7 @@ def generic_decoder():  # pragma: no cover
  
  def main():  # pragma: no cover
      import argparse
-    parser = argparse.ArgumentParser(description="PyDERASN ASN.1 DER decoder")
+    parser = argparse.ArgumentParser(description="PyDERASN ASN.1 BER/DER decoder")
      parser.add_argument(
          "--skip",
          type=int,
@@ -4591,6 +5176,11 @@ def main():  # pragma: no cover
          "--defines-by-path",
          help="Python path to decoder's defines_by_path",
      )
+    parser.add_argument(
+        "--nobered",
+        action='store_true',
+        help="Disallow BER encoding",
+    )
      parser.add_argument(
          "DERFile",
          type=argparse.FileType("rb"),
@@ -4607,13 +5197,10 @@ def main():  # pragma: no cover
          pprinter = partial(pprint, big_blobs=True)
      else:
          schema, pprinter = generic_decoder()
-    obj, tail = schema().decode(
-        der,
-        ctx=(
-            None if args.defines_by_path is None else
-            {"defines_by_path": obj_by_path(args.defines_by_path)}
-        ),
-    )
+    ctx = {"bered": not args.nobered}
+    if args.defines_by_path is not None:
+        ctx["defines_by_path"] = obj_by_path(args.defines_by_path)
+    obj, tail = schema().decode(der, ctx=ctx)
      print(pprinter(
          obj,
          oids=oids,