#!/usr/bin/env python
# This file should be available from
# http://www.pobox.com/~asl2/software/PyZ3950/
# and is licensed under the X Consortium license:
# Copyright (c) 2001, Aaron S. Lav, asl2@pobox.com
# All rights reserved.
# Permission is hereby granted, free of charge, to any person obtaining a
# copy of this software and associated documentation files (the
# "Software"), to deal in the Software without restriction, including
# without limitation the rights to use, copy, modify, merge, publish,
# distribute, and/or sell copies of the Software, and to permit persons
# to whom the Software is furnished to do so, provided that the above
# copyright notice(s) and this permission notice appear in all copies of
# the Software and that both the above copyright notice(s) and this
# permission notice appear in supporting documentation.
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
# OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT
# OF THIRD PARTY RIGHTS. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR
# HOLDERS INCLUDED IN THIS NOTICE BE LIABLE FOR ANY CLAIM, OR ANY SPECIAL
# INDIRECT OR CONSEQUENTIAL DAMAGES, OR ANY DAMAGES WHATSOEVER RESULTING
# FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT,
# NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION
# WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
# Except as contained in this notice, the name of a copyright holder
# shall not be used in advertising or otherwise to promote the sale, use
# or other dealings in this Software without prior written authorization
# of the copyright holder.
# Change history:
# 2001/9/22 - fix test code to be slightly more elegant and fix test
# comments to be correct. Due to Roy Smith, roy.smith@micromuse.com
# 2002/05/23 - fix handling of ANY. Needed for handling of SUTRS records
# by Z3950.
"""
asn1 is a relatively general-purpose ASN.1 BER encoder and decoder.
Encoding and
decoding functions (asn1.encode and asn1.decode) take an ASN.1 spec, and
transform back and forth between a byte stream and what I consider a natural
Python representation of the data.
Separating the ASN.1 specification from the code would allow
compilation of the specification to inline Python or C code, or to a
specification for a C-based engine.
This module supports the following ASN.1 types:
- BOOLEAN - encoder takes any Python value, decoder produces 0 or 1
- INTEGER - as in Python
- BITSTRING - asn1.BitStringVal
- OCTSTRING - Python string
- NULL - ignore value on encoding, return None on decoding
- REAL - asn1.REAL (I hope to make this look more like python floats someday: read the source if you need this)
- OID - OidVal
- EXTERNAL - as SEQUENCE, see below (or read the source)
- all string types - Python string (no validity checking is done)
For all the above types, the ASN.1 spec is just the name of the type.
Inherently constructed types:
- SEQUENCE_OF (ASN1.spec) - Python representation is a list of values.
-
SEQUENCE, CHOICE - the ASN.1 spec is a list of tuples, either (name, tag, type)
or, for SEQUENCE, (name, tag, type, optionalflag), where:
tag can be None, asn1.EXPLICIT(tag), asn1.IMPLICIT(tag), or an integer
interpreted as either an explicit or an implicit tag according to the setting
of asn1.implicit_default; type is recursively an ASN.1 spec.
For CHOICE, the Python representation is (name, val). For SEQUENCE, on
decoding,
the Python representation is an instance of an asn1-synthesized class.
On encoding, any class with the appropriate attributes is acceptable,
calling the SEQUENCE specification but you
can obtain a fresh instance of the synthesized class by calling the SEQUENCE
specification: this class overrides setattr to provide attribute-name error
checking. (The rationale for the seemingly unPythonic errorchecking is that
misspelled optional attributes would otherwise be hard to detect. If you don't
like it, it should be easy to turn off.)
The definition of enumerated values for INTEGER and BITSTRING types is
supported via the compiler (or see their definitions). For
BITSTRING types, __getitem__ (value_name) and __setitem__
(value_name) are implemented as BitStringVal methods, allowing,
e.g., bitstringval['version_1'] = 1
, or
if bitstringval['version_1']
. An appropriate BitStringVal for
encoding can be constructed by calling the specification.
For INTEGER types, call get_num_from_name (name)
or
get_name_from_num(num)
methods of the type specification.
(Note that code like if val == defn.get_num_from_name ('failure'):
is less prone to typo-induced errors than if
failure' == defn.get_name_from_num (val):
In order to obtain definitions nested inside other definitions
(e.g. INTEGER and BITSTRING, above), __getitem__ methods are provided
for SEQUENCE, CHOICE, and SEQUENCE_OF. For SEQUENCE and CHOICE, the
key is the name of the sequence element or arm (respectively).
For SEQUENCE_OF, the key is 0 (arbitrarily chosen).
APPLICATION and PRIVATE class tags are supported via the compiler,
or pass the cls=
keyword to IMPLICIT or EXPLICIT.
For examples, see the test code at the end of this file, or the
Z39.50 code that should be distributed with this file as part of PyZ3950.
There is not yet support for:
- UTCTime, SET, SET OF, or some more obscure types
Useful ASN.1 references:
"""
from __future__ import nested_scopes
vers = "0.83"
import array
import string
import copy
import math
# - elements should expose a list of possible tags, instead of just one tag,
# bringing CHOICE into line with other elements
# - make test cases more comprehensive
# - write test cases for INTEGER and BITSTRING enum. values
# - write test cases for asst. character set encodings
# Parameters you can tweak for BER encoding
implicit_default = 1
# Treat bare numeric tags as IMPLICIT if 1, EXPLICIT if 0. Set at
# definition time. This requires that all ASN.1 definitions be done
# single-threadedly - no big deal. It'd be somewhat more modular to
# look this up in the caller's module dictionary. The compiler produces
# explicit indications of whether a tag is EXPLICIT or IMPLICIT, so is
# unaffected by this setting.
indef_len_encodings = 0
# Generate indefinite-length encodings whenever we'd otherwise have to
# go back and fix up the length bytes if length octets were 1-byte long.
# Set at encoding time. Might make encoding run a little faster.
cons_encoding = 0
# Generate constructed encodings for string types. Useful only for
# testing the decoding of such encodings, I think.
# In theory, indef_len_encodings and cons_encoding are designed for
# cases where the length of the data isn't known ahead of time, and
# one doesn't want to have to buffer the entire thing. It is possible
# to pass lazy sequences into the appropriate functions, but ...
# For debugging the asn.1 code only
trace_seq = 0
trace_choice = 0
trace_tag = 0
trace_seq_of = 0
trace_int = 0
trace_external = 0
trace_byte = 0
trace_bitstring = 0
trace_string = 0
trace_codec = 0
# Note: BERError is only for decoding errors (either input data is illegal
# BER, or input data is legal BER but we don't support it.)
# call encode_per and decode_per for PER? Or check Ctx?
class BERError (Exception): pass
class EncodingError (Exception): pass
# Neither of these provides support for character set codecs. Instantiate
# the appropriate context and call set_codec for the set of string types
# you need with appropriate codecs.
def encode (spec, data):
ctx = Ctx ()
spec.encode (ctx, data)
return ctx.get_data ()
def decode (spec, buf, readproc = None):
ctx = IncrementalDecodeCtx(spec)
ctx.feed (buf)
while ctx.val_count () == 0:
ctx.feed (readproc ())
rv = ctx.get_first_decoded ()
# decode also ignores the possibility of leftover bytes.
# use IncrementalDecodeCtx.get_bytes_inprocess_count if you
# need to know about leftovers
return rv
UNIVERSAL_FLAG = 0
APPLICATION_FLAG = 0x40
CONTEXT_FLAG = 0x80
PRIVATE_FLAG = 0xC0
CONS_FLAG = 0x20
ANY_TAG = -1 # pseudotag
END_INDEF_CONS_TAG = 0x0
BOOL_TAG = 0x1
INT_TAG = 0x2
BITSTRING_TAG = 0x3
OCTSTRING_TAG = 0x4
NULL_TAG = 0x5
OID_TAG = 0x6
OBJECTDESCRIPTOR_TAG = 0x7
EXTERNAL_TAG = 0x8
REAL_TAG = 0x9
SEQUENCE_TAG = 0x10
UTF8STRING_TAG = 0xC
NUMERICSTRING_TAG = 0x12
PRINTABLESTRING_TAG = 0x13
T61STRING_TAG = 0x14
VIDEOTEXSTRING_TAG = 0x15
IA5STRING_TAG = 0x16
GENERALIZEDTIME_TAG = 0x18
GRAPHICSTRING_TAG = 0x19
VISIBLESTRING_TAG = 0x1A
GENERALSTRING_TAG = 0x1B
UNIVERSALSTRING_TAG = 0x1C
BMPSTRING_TAG = 0x1E
class StructBase:
# replace _allowed_attrib_list with __slots__ mechanism
# once we no longer need to support Python 2.1
_allowed_attrib_list = []
def __init__ (self, **kw):
self.set_allowed_attribs (self._allowed_attrib_list)
# we don't just self.__dict__.update (...) b/c
# we want error-checking in setattr below
for k, v in kw.items ():
setattr (self, k, v)
def __repr__ (self):
s = 'Struct: %s [\n' % (self.__class__)
i = self.__dict__.items ()
i.sort ()
i = filter (lambda it: it[0][0] <> '_', i)
s = s + string.join (map (lambda it: repr (it[0]) +
' ' + repr (it[1]), i), '\n')
s = s + ']\n'
return s
def __cmp__ (self, other):
keys = self.__dict__.keys ()
keys.sort () # to ensure reproduciblity
for k in keys:
s = getattr (self, k, None)
o = getattr (other, k, None)
def is_seq (val):
return (isinstance (val, type ((0,))) or
isinstance (val, type ([])))
if is_seq (s) and is_seq (o):
if len (s) <> len (o):
return -1
for selt, oelt in zip (s, o):
c = cmp (selt, oelt)
if c <> 0:
return c
else:
c = cmp (s, o)
if c <> 0:
return c
okeys = other.__dict__.keys ()
okeys.sort ()
if okeys <> keys:
return 1
return 0
def set_allowed_attribs (self, l):
self._allowed_attribs = {}
for e in l:
self._allowed_attribs [e] = 1
def is_allowed (self, k):
if self._allowed_attrib_list == []: return 1
if k == '_allowed_attribs': return 1
return self._allowed_attribs.has_key (k)
# I implemented setattr b/c otherwise it can be difficult to tell when one
# has mistyped an OPTIONAL element of a SEQUENCE. This is probably a matter
# of taste, and derived classes should feel welcome to override this.
def __setattr__ (self, key, val):
if not self.is_allowed (key):
raise AttributeError (key)
self.__dict__ [key] = val
# tags can match if only constructedness of encoding is different. Not
# quite right, since, e.g., SEQUENCE must always be a constructed type,
# and INTEGER never is, but this is OK because once we've matched,
# trying to decode an obligate cons. type with a noncons tag will fail
# because there's no decode_val attribute, and the other mismatch
# will fail because there's no start_cons attribute.
# This isn't a problem in CHOICEs because the uniqueness requirements
# are expressed in terms of numeric tags, regardless of cons flag.
def match_tag (a, b):
if trace_tag: print "Match_tag", a, b
cons_match = (a[0] & ~CONS_FLAG == b[0] & ~CONS_FLAG)
if (a[1] == ANY_TAG or b[1] == ANY_TAG):
return cons_match
return a[1] == b[1] and cons_match
def encode_base128 (val):
if val == 0:
return [0x00]
l = []
while val:
l.append ((val % 128) | 0x80)
val = val / 128
if len (l) > 0:
l[0] = l[0] & 0x7F
l.reverse ()
return l
def read_base128 (buf, start):
val = 0
while 1:
b = buf [start]
start += 1
val = val * 128 + (b & 0x7F)
if b & 0x80 == 0:
break
return (start, val)
class CtxBase:
"""Charset codec functionality, shared among all contexts."""
def __init__ (self):
self.charset_switch_oids = {}
self.codec_dict_stack = [{}]
# We may need different codecs for differing string types, e.g.
# VisibleString vs. UTF8String, thus the dict
def register_charset_switcher (self, oid, fn):
self.charset_switch_oids [oid] = fn
def set_codec (self, defn_inst, codec, strip_bom = 0):
if trace_codec:
print "setting codec", defn_inst, codec, strip_bom
print self.codec_dict_stack
# Note: really only need [0] and [1] elements of codec, encoder and decoder
self.codec_dict_stack[-1][defn_inst.base_tag] = (codec, strip_bom)
def get_codec (self, base_tag):
def default_enc (x):
if isinstance (x, type (u"")):
return (x.encode ('ascii'), 0)
return (x, 0)
identity = ((default_enc, lambda x:(x,0)), 0)
# we ignore lengths consumed. I don't think this means
# we miss out on any error checking, b/c if there were
# a stray pad byte or something, the codec would complain
# about truncation.
return self.codec_dict_stack[-1].get (base_tag, identity)
def get_enc (self, base_tag):
t = self.get_codec (base_tag)
return (t[0][0], t[1])
def get_dec (self, base_tag):
return self.get_codec (base_tag)[0][1]
def push_codec (self):
if trace_codec:
print "pushing codec"
self.codec_dict_stack.append ({})
def pop_codec (self):
if trace_codec:
print "popping codec"
self.codec_dict_stack.pop ()
class IncrementalDecodeCtx(CtxBase):
states = ["tag_first", "tag_rest", "len_first", "len_rest", "data",
"indef_end"]
class StackElt:
def __init__ (self, start_offset, cur_len, parent_typ, tag,
parent_ctx, cname = None):
self.start_offset = start_offset
self.len = cur_len
self.cname = cname
self.cons = parent_typ.start_cons (tag, cur_len, parent_ctx)
# methods: get_cur_def (), handle_val (val), finish ()
def __init__ (self, asn1_def):
CtxBase.__init__ (self)
self.offset = 0
self.last_begin_offset = 0
self.state = "tag_first"
self.asn1_def = asn1_def
self.decoded_vals = []
self.stack = []
self.state_fns = {}
for state in self.states:
self.state_fns [state] = getattr (self, 'feed_' + state)
def get_bytes_inprocess_count (self):
return self.offset - self.last_begin_offset
def val_count (self):
l = len (self.decoded_vals)
return l
def get_first_decoded (self):
rv = self.decoded_vals [0]
self.decoded_vals = self.decoded_vals [1:]
return rv
def get_cur_def (self):
if len (self.stack) == 0:
return self.asn1_def
else:
tos = self.stack [-1]
return tos.cons.get_cur_def (self.decoded_tag)
def match_tag (self, seen):
typ = self.get_cur_def ()
# Note: use 'is' instead of '=' to avoid problem w/
# OCTSTRING_class wanting __eq__ and failing b/c of getattr
if typ is None: # falling off end of SEQUENCE with optional bits
return 0
return typ.check_tag (seen)
# XXX calling check_tag is inefficient for SEQUENCE and CHOICE,
# b/c we have to iterate to check_tag, then use the tag again
# to figure out what type to decode.
def set_state (self, new_state):
self.state = new_state
def push (self, decoded_len):
new_typ = self.get_cur_def ()
cname = None
if isinstance (new_typ, CHOICE):
(cname, new_typ) = new_typ.check_tag (self.decoded_tag)
self.stack.append (self.StackElt (self.offset, decoded_len, new_typ,
self.decoded_tag, self,
cname = cname))
def pop (self):
if len (self.stack) == 0:
self.raise_error ("bad end of cons type")
tos = self.stack.pop ()
if tos.len <> None:
if tos.len <> (self.offset - tos.start_offset):
self.raise_error ("constructed len mismatch (%d %d %d)" %
(tos.len, self.offset, tos.start_offset))
val = tos.cons.finish ()
if tos.cname <> None:
val = (tos.cname, val)
self.handle_decoded (val)
def raise_error (self, descr):
raise BERError (descr + " offset %d" % (self.offset,))
def feed (self, data):
for char in data:
if trace_byte:
print hex (char), self.state, "offset:", self.offset
self.state_fns [self.state] (char)
self.offset += 1
def feed_tag_first (self, char):
if char == 0x00:
stacklen = len (self.stack)
if stacklen == 0 or self.stack[-1].len <> None:
if stacklen == 0:
tos_len_str = "irrelevant"
else:
tos_len_str = str (self.stack[-1].len)
self.raise_error ("0x00 tag found, stacklen %d tos len %s" %
(stacklen, tos_len_str))
self.set_state ("indef_end")
return
flags = char & 0xE0
val = char & 0x1f
self.decoded_tag = (flags, val)
if val == 0x1f:
self.set_state ("tag_rest")
self.tag_accum = 0
else:
self.finish_tag ()
def feed_tag_rest (self, char):
self.tag_accum = self.tag_accum * 128 + (char & 0x7f)
if char & 0x80 == 0:
self.decoded_tag = (self.decoded_tag[0], self.tag_accum)
self.tag_accum = None
self.finish_tag ()
def finish_tag (self):
if not self.match_tag (self.decoded_tag):
self.raise_error ("Saw tag %s expecting %s" %
(str(self.decoded_tag),
self.get_cur_def().str_tag ()))
self.set_state ("len_first")
def feed_len_first (self, char):
if char >= 128:
rest_len = char & 0x7f
if rest_len == 0:
self.decoded_len = None
self.finish_len ()
else:
self.rest_len = rest_len
self.decoded_len = 0
self.set_state ("len_rest")
else:
self.decoded_len = char
self.finish_len ()
def feed_len_rest (self, char):
self.decoded_len = self.decoded_len * 256 + char
self.rest_len -= 1
if self.rest_len == 0:
self.finish_len ()
def finish_len (self):
if self.decoded_tag == (0,0):
if self.decoded_len <> 0:
self.raise_error ("Bad len %d for tag 0" % (self.decoded_len,))
self.pop ()
return
self.data_buf = []
cons_flag = self.decoded_tag [0] & CONS_FLAG
if cons_flag:
self.push (self.decoded_len)
new_state = "tag_first"
else:
new_state = "data"
if self.decoded_len == 0:
if cons_flag:
assert (self.check_pop ())
self.set_state ("tag_first")
else:
self.finish_data ()
else:
self.set_state (new_state)
def feed_data (self, char):
self.data_buf.append (char)
self.decoded_len -= 1
if self.decoded_len == 0:
self.finish_data ()
def finish_data (self):
cur_def = self.get_cur_def ()
if isinstance (cur_def, CHOICE):
(cname, ctyp) = cur_def.check_tag (self.decoded_tag)
cur_def = ctyp
else:
cname = None
if not (cur_def is None): # we haven't fallen off end of a SEQ
rv = cur_def.decode_val (self, self.data_buf)
if cname <> None:
rv = (cname, rv)
self.handle_decoded (rv)
else:
assert (self.check_pop ())
self.set_state ("tag_first")
def handle_decoded (self, val):
if len (self.stack) == 0:
self.decoded_vals.append (val)
self.last_begin_offset = self.offset + 1
# +1 because self.offset will be incremented on return
else:
self.stack[-1].cons.handle_val (val)
self.check_pop ()
def check_pop (self):
if self.stack[-1].len == self.offset - self.stack[-1].start_offset:
self.pop ()
return 1
return 0
def feed_indef_end (self, char):
if char <> 0x00:
self.raise_error ("end cons indef-len encoding %x" % (char,))
self.pop ()
self.set_state ("tag_first")
def tag_to_buf (tag, orig_flags = None):
(flags, val) = tag
# Constructed encoding is property of original tag, not of
# implicit tag override
if orig_flags <> None:
flags = flags | (orig_flags & CONS_FLAG)
extra = 0
if val >=0x1F:
extra = val
val = 0x1F
l = [flags | val]
if extra:
l2 = encode_base128 (extra)
l.extend (l2)
return l
def len_to_buf (mylen):
if mylen < 128:
return [mylen]
else:
l = []
while mylen:
l.append (mylen % 256)
mylen = mylen / 256
assert (len (l) < 0x80)
l.append (len (l) | 0x80)
l.reverse ()
return l
class WriteCtx (CtxBase):
def __init__ (self):
CtxBase.__init__ (self)
self.clear ()
def clear (self):
self.buf = array.array ('B')
def encode (self, spec, data):
self.clear ()
spec.encode (self, data)
return self.get_data ()
def get_data (self):
return self.buf
def bytes_write (self, data):
# type-checking is icky but required by array i/f
if isinstance (data, type ([])):
self.buf.fromlist (data)
elif isinstance (data, type ('')):
self.buf.fromstring (data)
else:
raise EncodingError, "Bad type to bytes_write"
BYTE_BITS = 8
def extract_bits (val, lo_bit, hi_bit):
tmp = (val & (~0L << (lo_bit))) >> lo_bit
tmp = tmp & ((1L << (hi_bit - lo_bit + 1)) - 1)
return tmp
log_of_2 = math.log (2)
def log2 (x):
return int(math.log (x) / log_of_2)
class PERWriteCtx(WriteCtx):
def __init__ (self, aligned = 0, canonical = 0):
self.aligned = aligned
self.canonical = canonical
self.bit_offset = 0
WriteCtx.__init__ (self)
def write_bits_unaligned (self, val, bit_len):
# write starting at bit_offset, no matter what
byte_count = (bit_len + self.bit_offset) / BYTE_BITS
if (bit_len + self.bit_offset) % BYTE_BITS <> 0:
byte_count += 1
my_range = range (byte_count - 1, -1, -1)
lo_bits = map (lambda x: x * BYTE_BITS, my_range)
def extract_val (lo_bit):
return extract_bits (val, lo_bit, lo_bit + BYTE_BITS - 1)
bytes = map (extract_val, lo_bits)
new_bit_offset = (bit_len + self.bit_offset) % BYTE_BITS
if new_bit_offset <> 0:
bytes [-1] = bytes [-1] << (BYTE_BITS - new_bit_offset)
if self.bit_offset <> 0:
self.buf[-1] = self.buf[-1] | bytes [0]
self.bytes_write (bytes[1:])
else:
self.bytes_write (bytes)
self.bit_offset = new_bit_offset
def write_bits (self, val, bit_len):
if self.aligned and self.bit_offset <> 0:
self.write_bits_unaligned (0, BYTE_BITS - self.bit_offset)
self.bit_offset = 0
self.write_bits_unaligned (val, bit_len)
# for {read,write}_*_int, see Dubuisson 20.4
def write_constrained_int (self, val, lo, hi):
assert (hi >= lo)
# XXX what if hi = lo + 1
rng = hi - lo + 1
print rng, val, log2(rng)
if not self.aligned:
self.write_bits (val, log2(rng))
return
if rng == 1:
return # known value, don't encode
if rng < 256:
return # calc minimum # of bits
if rng == 256:
self.write_bits (val - lo, 8)
return
if rng <= 65536:
self.write_bits (val - lo, 16)
return
assert (0)
def write_semiconstrained_int (self, val, lo):
# write len field, then len, then min octets log_256(val-lo)
assert (0)
pass
def write_unconstrained_int (self, val): # might have upper bd, but not used
assert (0)
pass
def write_usually_small_int (self, val):
assert (val >= 0)
if val < 64:
self.write_bits_unaligned (0, 1)
self.write_bits_unaligned (val, 6)
else:
self.write_bits_unaligned (1,1)
self.write_semiconstrained_int (val, 0)
class BERWriteCtx(WriteCtx):
def __init__ (self):
WriteCtx.__init__ (self)
def clear (self):
self.cur_tag = None
WriteCtx.clear (self)
def set_implicit_tag (self, tag):
if self.cur_tag == None:
self.cur_tag = tag
def tag_write (self, tag):
if trace_tag: print "Writing tag", tag
(orig_flags, _) = tag
if self.cur_tag <> None:
tag = self.cur_tag
self.cur_tag = None
l = tag_to_buf (tag, orig_flags)
self.bytes_write (l)
def get_pos (self):
return len (self.buf)
class LenPlaceHolder:
def __init__ (self, ctx, estlen = 127):
if not indef_len_encodings:
self.ctx = ctx
self.oldpos = ctx.get_pos ()
self.estlen = estlen
self.lenlen = ctx.est_len_write (estlen)
else:
self.ctx = ctx
ctx.bytes_write ([0x80])
def finish (self):
if not indef_len_encodings:
real_len = self.ctx.get_pos() - self.oldpos - 1
self.ctx._len_write_at (self.ctx.get_pos () - self.oldpos - 1,
self.oldpos, self.lenlen)
else:
self.ctx.bytes_write ([0,0])
def len_write (self, mylen = 0):
return Ctx.LenPlaceHolder (self, mylen)
def len_write_known (self, mylen):
return self.est_len_write (mylen)
def est_len_write (self, mylen):
l = len_to_buf (mylen)
self.buf.fromlist (l)
return len (l)
def _len_write_at (self, mylen, pos, lenlen):
l = len_to_buf (mylen)
assert (len(l) >= lenlen)
# array.pop not available in Python 1.5.2. We could just use a
# less efficient length encoding (long form w/leading 0 bytes
# where necessary), but ...
# XXX fix to use more efficient code, now that we don't support 1.5.2!
for i in range (len(l) - lenlen):
self.buf.insert (pos, 0)
for i in range(len(l)):
self.buf[pos + i] = l [i]
def raise_error (self, descr):
offset = len (self.buf)
raise BERError, (descr, offset)
Ctx = BERWriteCtx # Old synonym for historical reasons
# EXPLICIT, IMPLICIT, CHOICE can't derive from eltbase b/c they need to do
# tag manipulation
class ELTBASE:
# known_len is 1 if len can easily be calculated w/o encoding
# val (e.g. OCTET STRING),
# 0 if otherwise and we have to go back and fix up (e.g. SEQUENCE).
def encode (self, ctx, val):
ctx.tag_write (self.tag)
if not self.known_len: lph = ctx.len_write ()
self.encode_val (ctx, val)
if not self.known_len: lph.finish ()
def check_tag (self, seen_tag):
return match_tag (seen_tag, self.tag)
def str_tag (self):
if hasattr (self, 'tag'):
return str (self.tag)
else:
return self.__class__.__name__
def fulfill_promises (self, promises):
return
class TAG: # base class for IMPLICIT and EXPLICIT
def __init__ (self, tag, cls=CONTEXT_FLAG):
if type (tag) == type (0):
tag = (CONTEXT_FLAG, tag)
self.tag = (tag[0] | self.flags, tag[1])
def set_typ (self, typ):
self.typ = typ
def __call__ (self):
return self.typ ()
def __getitem__ (self, *args):
return self.typ.__getitem__ (*args)
def __setitem__ (self, *args):
return self.typ.__setitem__ (*args)
def get_num_from_name (self, *args):
return self.typ.get_num_from_name (*args)
def get_name_from_num (self, *args):
return self.typ.get_name_from_num (*args)
def decode_val (self, ctx, buf):
return self.typ.decode_val (ctx, buf)
def str_tag (self):
return str (self.tag)
def check_tag (self, seen_tag):
return match_tag (seen_tag, self.tag)
def fulfill_promises (self, promises):
if isinstance (self.typ, Promise):
self.typ = self.typ.get_promised (promises)
else:
self.typ.fulfill_promises (promises)
# Note: IMPLICIT and EXPLICIT have dual use: they can be instantiated by
# users of this module to indicate tagging, but when TAG.set_typ is
# called, they become asn.1 type descriptors themselves. Maybe these
# two uses should have separate classes, making four classes overall.
class IMPLICIT(TAG):
flags = 0
def __repr__ (self):
return "IMPLICIT: " + repr (self.tag) + " " + repr (self.typ)
def __cmp__ (self, other):
if not isinstance (other, IMPLICIT):
return -1
return cmp (self.tag, other.tag)
def start_cons (self, tag, cur_len, ctx):
return self.typ.start_cons (tag, cur_len, ctx)
def encode (self, ctx, val):
ctx.set_implicit_tag (self.tag)
self.typ.encode (ctx, val)
def encode_per (self, ctx, val):
self.typ.encode_per (ctx, val)
class EXPLICIT (TAG):
flags = CONS_FLAG # Explicit tag is always a constructed encoding
def __repr__ (self):
return "EXPLICIT: " + repr (self.tag) + " " + repr (self.typ)
def __cmp__ (self, other):
if not isinstance (other, EXPLICIT):
return -1
return cmp (self.tag, other.tag)
class ConsElt:
def __init__ (self, typ):
self.typ = typ
self.ind = 0
def get_cur_def (self, seen_tag):
return self.typ
def handle_val (self, val):
self.tmp = val
self.ind += 1
def finish (self):
if self.ind <> 1:
raise BERError ("wrong number of elts %d for EXPLICIT %s" %
(self.ind, self.typ))
return self.tmp
def start_cons (self, tag, cur_len, ctx):
return self.ConsElt (self.typ)
def encode (self, ctx, val):
ctx.cur_tag = None
ctx.tag_write (self.tag)
lph = ctx.len_write ()
self.typ.encode (ctx, val)
lph.finish ()
def make_tag (tag):
if implicit_default:
return IMPLICIT (tag)
else:
return EXPLICIT (tag)
def TYPE (tag, typ):
if tag == None:
return typ
if not isinstance (tag, TAG):
tag = make_tag (tag)
tag.set_typ (typ)
return tag
class OidVal:
def __init__ (self, lst):
self.lst = tuple (lst)
self.encoded = self.encode (lst)
def __hash__ (self):
return hash (self.lst)
def __repr__ (self):
s = 'OID:'
for i in self.lst:
s = s + ' %d' % i
return s
def __cmp__ (self, other):
if not hasattr (other, 'lst'):
return -1
return cmp (self.lst, other.lst)
def encode (self, lst):
encoded = [40 * lst [0] + lst [1]]
for val in lst [2:]:
encoded = encoded + encode_base128 (val)
return encoded
class OID_class (ELTBASE):
tag = (0, OID_TAG)
known_len = 1
def encode_val (self, ctx, val):
ctx.len_write_known (len (val.encoded))
ctx.bytes_write (val.encoded)
def decode_val (self, ctx, buf):
b1 = buf [0]
oid = [b1 / 40, b1 % 40]
start = 1
mylen = len (buf)
while start < mylen:
(start, val) = read_base128 (buf, start)
oid.append (val)
return OidVal (oid)
OID = OID_class ()
# XXX need to translate into offset in list for PER encoding
class NamedBase:
def __init__ (self, names_list = [], lo = None, hi = None):
self.lo = lo
self.hi = hi
if names_list == None:
names_list = []
self.name_to_num = {}
self.num_to_name = {}
self.names_list = names_list
for (name, num) in names_list:
self.num_to_name [num] = name
self.name_to_num [name] = num
num_keys = self.num_to_name.keys ()
if len (num_keys) > 0:
self.max = max (self.num_to_name.keys ())
else:
self.max = 0
def get_num_from_name (self, *args):
return self.name_to_num.get (*args)
def get_name_from_num (self, *args):
return self.num_to_name.get (*args)
class INTEGER_class (ELTBASE, NamedBase):
tag = (0, INT_TAG)
known_len = 1
def __init__ (self, *args):
NamedBase.__init__ (self, *args)
if self.max <> 0:
self.hi = self.max # XXX reorganize!
self.extensible = 0 # XXX
def encode_val (self, ctx, val):
# based on ber.py in pysnmp
l = []
if val == 0:
l = [0]
elif val == -1:
l = [0xFF]
else:
if sgn (val) == -1:
term_cond = -1
last_hi = 1
else:
term_cond = 0
last_hi = 0
while val <> term_cond:
val, res = val >> 8, (val & 0xFF)
l.append (res)
if (l[-1] & 0x80 <> 0) ^ last_hi:
l.append (last_hi * 0xFF)
ctx.len_write_known (len(l))
l.reverse ()
ctx.bytes_write (l)
def encode_per (self, ctx, val):
assert (not self.extensible)
assert (self.lo <> None)
print "encoding", val, self.lo, self.hi
if self.hi == None:
ctx.write_semiconstrained_int (val, self.lo)
else:
ctx.write_constrained_int (val, self.lo, self.hi)
def decode_val (self, ctx, buf):
val = 0
if buf[0] >= 128: sgn = -1
else: sgn = 1
for b in buf:
if trace_int: print "Reading INTEGER byte", b
val = 256 * val + sgn * b
if sgn == -1:
val = - (val + pow (2, 8 * len (buf)))
# XXX should be much more efficient decoder here
return val
INTEGER = INTEGER_class ()
class ConditionalConstr:
def __getattr__ (self, attr): # XXX replace with properties when can require 2.2.
if attr == 'tag':
base_tag = self.__dict__ ['base_tag']
if cons_encoding:
return (CONS_FLAG, base_tag)
else:
return (0, base_tag)
elif attr == 'known_len' and self.override_known_len:
return not cons_encoding
else:
return self.__dict__ [attr]
class OCTSTRING_class (ConditionalConstr, ELTBASE):
def __init__ (self, tag = None, lo = None, hi = None):
if tag <> None:
self.base_tag = tag
else:
self.base_tag = OCTSTRING_TAG
self.override_known_len = 1
self.extensible = 0 # XXX
self.lo = lo
self.hi = hi
def __repr__ (self):
return 'OCTSTRING: ' + repr (self.tag)
class ConsElt:
def __init__ (self):
self.lst = []
def get_cur_def (self, seen_tag):
return OCTSTRING
def handle_val (self, val):
self.lst.append (val)
def finish (self):
return "".join (self.lst)
def start_cons (self, tag, cur_len, ctx):
return self.ConsElt ()
def handle_charset (self, ctx, val):
encoder, strip_bom = ctx.get_enc (self.base_tag)
if trace_string:
print "encoding", type (val), encoder, self.base_tag, strip_bom,
(val, l) = encoder (val)
if strip_bom:
val = val[2:]
if trace_string:
print "encoded", val
return val
def encode_val (self, ctx, val):
val = self.handle_charset (ctx, val)
if cons_encoding:
# Dubuisson, _ASN.1 ..._, 18.2.10 says that string
# types are encoded like OCTETSTRING, so no worries
# about preserving character boundaries in constructed
# encodings.
tag = (0, OCTSTRING_TAG)
for i in range (len (val)):
ctx.tag_write (tag)
ctx.len_write_known (1)
ctx.bytes_write ([ord(val[i])])
else:
ctx.len_write_known (len (val))
ctx.bytes_write (val)
def encode_per (self, ctx, val):
val = handle_charset (ctx, val)
assert (not self.extensible)
l = len (val)
if self.lo <> None and self.lo == self.hi:
if l <= 2:
ctx.write_bits_unaligned (val, l * BYTE_BITS)
elif l <= 8192:
ctx.write_bits (val, l * BYTE_BITS)
else:
assert (0) # XXX need to fragment!
assert (len < 65536)
if self.hi == None:
ctx.write_semiconstrained_int (l, self.lo)
else:
ctx.write_constrained_int (l, self.lo, self.hi)
ctx.write_bits (val, l * BYTE_BITS)
def decode_val (self, ctx, buf):
tmp_str = ''.join (map (chr, buf))
decoder = ctx.get_dec (self.base_tag)
if trace_string:
print "decoding", repr(tmp_str), decoder, self.base_tag
rv = decoder (tmp_str)
if trace_string:
print repr (rv)
return rv [0]
_STRING_TAGS = (UTF8STRING_TAG, NUMERICSTRING_TAG, PRINTABLESTRING_TAG,
T61STRING_TAG, VIDEOTEXSTRING_TAG, IA5STRING_TAG,
GRAPHICSTRING_TAG, VISIBLESTRING_TAG, GENERALSTRING_TAG,
UNIVERSALSTRING_TAG, BMPSTRING_TAG, GENERALIZEDTIME_TAG,
OBJECTDESCRIPTOR_TAG)
OCTSTRING = OCTSTRING_class ()
(UTF8String, NumericString, PrintableString, T61String, VideotexString,
IA5String, GraphicString, VisibleString, GeneralString, UniversalString,
BMPString, GeneralizedTime, ObjectDescriptor) = \
map (OCTSTRING_class, _STRING_TAGS)
class CHOICE:
choice_type = 1
# No class.tag, tag derives from chosen arm of CHOICE
def __init__ (self, c):
self.promises_fulfilled = 0
# XXX self.promises_fulfilled is only needed for CHOICE,
# but could speed up by adding checking to SEQUENCE, SEQUENCE_OF, etc.
self.choice = []
# XXX rework this to use dict by arm name, dict by tag?
# but CHOICE of CHOICE constructs mean that a typ can have
# multiple possible tags, so a little more difficult
for arm in c:
self.choice.append (self.mung (arm))
def __getitem__ (self, key):
for (cname, ctyp) in self.choice:
if key == cname:
return ctyp
raise KeyError (key)
def __setitem__ (self, key, val): # warning: may raise KeyError!
for i in range (len (self.choice)):
(cname, ctyp) = self.choice [i]
if cname == key:
self.set_arm (i, val)
return
raise KeyError (key)
def fulfill_promises (self, promises):
if self.promises_fulfilled:
return
self.promises_fulfilled = 1
for i in range (len (self.choice)):
if isinstance (self.choice [i][1], Promise):
self.choice [i][1] = self.choice[i][1].get_promised (promises)
else:
self.choice[i][1].fulfill_promises (promises)
def set_arm (self, i, new_arm):
self.choice[i] = self.mung (new_arm)
def mung (self, arm):
(cname, ctag, ctyp) = arm
ctyp = TYPE (ctag, ctyp)
return [cname, ctyp]
def str_tag (self):
return repr (self)
def check_tag (self, seen_tag):
for (cname, ctyp) in self.choice:
if ctyp.check_tag (seen_tag):
return (cname, ctyp)
return 0
def __repr__ (self):
return 'CHOICE: ' + string.join (map (lambda x:x[0],self.choice), '\n')
# Note: we don't include types in the repr, because that can induce
# infinite recursion.
def encode (self, ctx, val):
if trace_choice: print val
(name, val) = val
for (cname, ctyp) in self.choice:
if cname == name:
if trace_choice: print "Encoding arm", cname, "Val", val
ctyp.encode (ctx, val)
return
err = ("Bogus, no arm for " + repr (name) + " val " +
repr(val))
raise EncodingError,err
# Note: ANY can be any type, not just OCTSTRING. The ASN.1 spec
# is supposed to indicate an OID (or something) which we can use to
# figure out how to encode/decode the ANY type. For EXTERNAL,
# this is well-defined and implemented via register_oid (although we
# don't support indirect_reference).
# On decoding, if the incremental decoder is used and no type
# is specified, the result looks like:
# (tag, , indef-len-flag)
# or a list instead of a string for constructed types.
# (The non-incremental decoder can't handle ANY types with indef-len
# encoding, and just returns a byte string for def-len encoding. I
# recommend the incremental decoder.)
# The encoder expects the output of the incremental decoder.
# Note that indef-len-flag can usually be ignored, and is only
# valuable for applications which decode and then encode and expect
# the results to be byte-identical, which is basically test apps.
class ANY_class(OCTSTRING_class): # inherit decode_val
tag = (CONS_FLAG, ANY_TAG)
class ConsElt:
def __init__ (self, tag, cur_len):
self.tmp = []
self.tag = tag
self.indef_flag = cur_len == None
def get_cur_def (self, seen_tag):
return ANY
def handle_val (self, val):
self.tmp.append (val)
def finish (self):
return (self.tag, self.tmp, self.indef_flag)
def start_cons (self, tag, cur_len, ctx):
return self.ConsElt (tag, cur_len)
def encode_aux (self, val):
(tag, val, indef_flag) = val
if isinstance (val, type ([])):
buf = "".join (map (self.encode_aux, val))
elif isinstance (val, type (())):
buf = self.encode_aux (val)
else:
buf = val
def tostr (lst):
return "".join (map (chr, lst))
if indef_flag:
return tostr (tag_to_buf (tag)) + "\x80" + buf + "\0\0"
else:
buf_len = len (buf)
return tostr (tag_to_buf (tag)) + tostr (len_to_buf (buf_len)) +buf
def encode (self, ctx, val):
ctx.bytes_write (self.encode_aux(val))
def check_tag (self, seen_tag):
return 1
def decode_val (self, ctx, buf):
v = OCTSTRING_class.decode_val (self, ctx, buf)
return (ctx.decoded_tag, v, 0) # only called for primitive def-len encoding, thus "0"
ANY = ANY_class ()
class BitStringVal:
def __init__ (self, top, bits = 0, defn = None):
self.top_ind = top # 0-based, -1 is valid, indicating no sig. bits
self.bits = bits
self.defn = defn
def __repr__ (self):
names = []
for i in range (self.top_ind + 1):
if self.is_set (i):
def mk_unk ():
return "Unknown(%d)" % (i,)
if (not hasattr (self.defn, 'num_to_name') or
self.defn.num_to_name == None):
names.append (mk_unk ())
else:
names.append (self.defn.num_to_name.get (i, mk_unk ()))
return "Top: %s Bits %s Names %s" % (repr(self.top_ind),
repr(self.bits),
",".join (names))
def __cmp__ (self, other):
return cmp ((self.top_ind, self.bits), (other.top_ind, other.bits))
def check_extend (self, bit):
if bit > self.top_ind:
self.bits = self.bits << (bit - self.top_ind)
self.top_ind = bit
def set (self, bit):
self.check_extend (bit)
self.bits = self.bits | (1L << (self.top_ind - bit))
def clear (self, bit):
self.check_extend (bit)
self.bits = self.bits & ~(1L << (self.top_ind - bit))
def set_bits (self, bitseq):
for bit in bitseq:
self.set (bit)
def is_set (self, bit):
if self.top_ind - bit < 0:
return 0
return self.bits & (1L << ( self.top_ind - bit))
def __getitem__ (self, bit_name):
bit_ind = self.defn.get_num_from_name (bit_name)
return self.is_set (bit_ind)
def __setitem__ (self, key, val):
ind = self.defn.get_num_from_name (key)
if val:
self.set (ind)
else:
self.clear (ind)
class BITSTRING_class (ConditionalConstr, ELTBASE, NamedBase):
known_len = 1
def __init__ (self, *args):
self.base_tag = BITSTRING_TAG
self.override_known_len = 0
NamedBase.__init__ (self, *args)
def __call__ (self):
return BitStringVal (self.max, 0, self)
class ConsElt:
def __init__ (self, parent):
self.lst = []
self.parent = parent
def get_cur_def (self, seen_tag):
return BITSTRING
def handle_val (self, val):
self.lst.append (val)
def finish (self):
bits = 0L
for v in self.lst[:-1]:
bits *= 256L
assert (v.top_ind == 7)
bits += v.bits
v = self.lst [-1]
bits *= 256L
pad_count = 7 - v.top_ind
bits = bits >> pad_count
bits += v.bits # v.bits have already been right-shifted by decoder
return BitStringVal (8 * len (self.lst) - pad_count - 1, bits, self.parent)
def start_cons (self, tag, cur_len, ctx):
return self.ConsElt (self)
def encode_val (self, ctx, val):
def top_ind_to_pad_bits (top_ind):
bit_count = (top_ind + 1) % 8 # top_ind is 0-based
if bit_count == 0: return 0
return (8 - bit_count)
assert (top_ind_to_pad_bits (0) == 7)
assert (top_ind_to_pad_bits (7) == 0)
assert (top_ind_to_pad_bits (8) == 7)
assert (top_ind_to_pad_bits (10) == 5)
assert (top_ind_to_pad_bits (15) == 0)
pad_bits_count = top_ind_to_pad_bits (val.top_ind)
val_len = ((val.top_ind + 1) / 8) + 1
# + 1 for count of padding bits, count always 1 byte
if pad_bits_count <> 0:
val_len += 1
l = []
to_write = (1L * val.bits) << pad_bits_count
for i in range (val_len - 1):
l.append (to_write % 256)
to_write = to_write / 256
assert (to_write >= 0)
if not cons_encoding:
ctx.len_write_known (val_len)
l.append (pad_bits_count)
l.reverse ()
ctx.bytes_write (l)
else:
ctx.bytes_write ([0x80]) # Dubuisson p. 403 says indef-len req'd
l.reverse ()
for i in range (len (l) - 1):
v = [0x3, 0x2, 0x0, l[i]]
if trace_bitstring: print "encoding", v
ctx.bytes_write (v)
v = [0x3, 0x2, pad_bits_count, l[-1]]
if trace_bitstring: print "encoding last", v
ctx.bytes_write (v)
ctx.bytes_write ([0x00,0x00])
def decode_val (self, ctx, buf):
if trace_bitstring:
print "bitstring", buf
pad_bits = buf [0]
bits = 0
for b in buf [1:]:
bits = 256L * bits + b
bits = bits >> pad_bits
return BitStringVal ((len(buf) - 1) * 8 - pad_bits - 1 , bits,
self)
BITSTRING = BITSTRING_class ()
class SeqConsElt:
def __init__ (self, seq):
self.index = 0
self.seq = seq
self.tmp = seq.klass ()
def get_cur_def (self, seen_tag):
r = range (self.index, len (self.seq.seq))
for i in r:
(name, typ, optional) = self.seq.seq [i]
if typ.check_tag (seen_tag):
self.index = i
return typ
if not optional:
raise BERError ("SEQUENCE tag %s not found in %s (%d/%d)" %
(str (seen_tag), str (self.seq),
self.index, i))
# OK, we fell off the end. Must just be absent OPTIONAL types.
return None
def handle_val (self,val):
setattr (self.tmp, self.seq.seq[self.index][0], val)
self.index += 1
def finish (self):
for i in range (self.index, len (self.seq.seq)):
(name, typ, optional) = self.seq.seq[i]
if not optional:
raise BERError (
"non-opt data missing from seq %s at %d (so far %s)" %
(str (self.seq), self.index, str (self.tmp)))
return self.tmp
class SEQUENCE_BASE (ELTBASE):
tag = (CONS_FLAG, SEQUENCE_TAG)
known_len = 0
def __init__ (self, klass, seq):
self.klass = klass
self.seq = []
for e in seq:
self.seq.append (self.mung (e))
self.extensible = 0
def __call__ (self, **kw):
return apply (self.klass, (), kw)
def mung (self, e):
if len (e) == 3:
(name, tag, typ) = e
optional = 0
elif len (e) == 4:
(name, tag, typ, optional) = e
else: assert (len(e) == 3 or len(e) == 4)
typ = TYPE (tag, typ)
return (name, typ, optional)
def __repr__ (self):
return ('SEQUENCE: ' + repr (self.klass) +
'\n' + string.join (map (repr, self.seq), '\n'))
def __getitem__ (self, key):
for e in self.seq:
if e[0] == key:
return e[1]
raise KeyError (key)
def __setitem__ (self, key, val):
for i in range (len (self.seq)):
if self.seq[i][0] == key:
self.seq[i] = self.mung (val)
return
raise "not found" + str (key)
def fulfill_promises (self, promises):
for i in range (len(self.seq)):
(name, typ, optional) = self.seq[i]
if isinstance (typ, Promise):
self.seq[i] = (name, typ.get_promised (promises), optional)
else:
typ.fulfill_promises (promises)
def get_attribs (self):
return map (lambda e: e[0], self.seq)
def start_cons (self, tag, cur_len, ctx):
return SeqConsElt (self)
def encode_per (self, ctx, val):
any_optional = 0 # XXX replace w/ every
for (attrname, typ, optional) in self.seq:
any_optional = any_optional or optional
if any_optional:
for (attrname, typ, optional) in self.seq:
ctx.write_bits_unaligned (hasattr (val, attrname), 1)
for (attrname, typ, optional) in self.seq:
try:
v = getattr (val, attrname)
# XXX need to handle DEFAULT,not encode
except AttributeError:
if optional: continue
else: raise EncodingError, ("Val " + repr(val) +
" missing attribute: " +
str(attrname))
if trace_seq: print "Encoding", attrname, v
typ.encode_per (ctx, v)
def encode_val (self, ctx, val):
for (attrname, typ, optional) in self.seq:
try:
v = getattr (val, attrname)
except AttributeError:
if optional: continue
else: raise EncodingError, ("Val " + repr(val) +
" missing attribute: " +
str(attrname))
if trace_seq: print "Encoding", attrname, v
typ.encode (ctx, v)
import new
# SEQUENCE returns an object which is both an asn.1 spec and a callable
# which generates a struct template to fill in.
# I used to have SEQUENCE taking a classname and, using ~8 lines of
# black (OK, grayish) magic (throw an exn, catch it, and futz with the
# caller's locals dicts), bind the klass below in the caller's namespace.
# This meant I could provide bindings for SEQUENCEs nested inside other
# definitions (making my specs look more like the original ASN.1), and
# that I got the correct name for debugging purposes instead of using
# mk_klass_name (). I took it out b/c I didn't like the magic or the
# funny syntax it used (a mere function call caused an alteration to the
# caller's ns)
# Now, the compiler takes care of generating the correct names for
# top-level SEQUENCE definitions, and should be extended to handle
# SEQUENCEs nested inside others.
class Ctr:
def __init__ (self):
self.count = 0
def __call__ (self):
self.count = self.count + 1
return self.count
class_count = Ctr ()
# This name only appears in debugging displays, so no big deal.
def mk_seq_class_name ():
return "seq_class_%d" % class_count ()
class EXTERNAL_class (SEQUENCE_BASE):
tag = (CONS_FLAG, EXTERNAL_TAG)
def __repr__ (self):
return ('EXTERNAL: ' + repr (self.klass) +
'\n' + string.join (map (repr, self.seq), '\n'))
class ConsElt(SeqConsElt):
def __init__ (self, seq, ctx):
self.ctx = ctx
self.codec_pushed = 0
SeqConsElt.__init__ (self, seq)
def get_cur_def (self, seen_tag):
self.found_ext_ANY = 0
r = range (self.index, len (self.seq.seq))
for i in r:
(name, typ, optional) = self.seq.seq [i]
if typ.check_tag (seen_tag):
self.index = i
if name == 'encoding' and seen_tag [1] == 0:
asn = check_EXTERNAL_ASN (self.tmp)
if asn <> None:
self.found_ext_ANY = 1
typ = asn
new_codec_fn = self.ctx.charset_switch_oids.get (
getattr (self.tmp, 'direct_reference',
None), None)
if new_codec_fn <> None:
self.ctx.push_codec ()
new_codec_fn ()
self.codec_pushed = 1
return typ
if not optional:
raise BERError ("EXTERNAL tag %s not found in %s (%d/%d)" %
(str (seen_tag), str (self.seq),
self.index, i))
# This is, in fact, an error, because the last bit of
# external isn't optional
raise BERError ("EXTERNAL tag %s not found" % (str (seen_tag),))
def handle_val (self,val):
if self.found_ext_ANY:
val = ('single-ASN1-type', val)
if self.codec_pushed:
self.ctx.pop_codec ()
SeqConsElt.handle_val (self, val)
def start_cons (self, tag, cur_len, ctx):
return self.ConsElt (self, ctx)
def encode_val (self, ctx, val):
new_codec_fn = None
for (attrname, typ, optional) in self.seq:
try:
v = getattr (val, attrname)
except AttributeError:
if optional: continue
else: raise EncodingError, ("Val " + repr(val) +
" missing attribute: " +
str(attrname))
if attrname == 'encoding' and v[0] == 'single-ASN1-type':
asn = check_EXTERNAL_ASN (val)
if asn <> None:
typ = asn
v = v[1]
new_codec_fn = ctx.charset_switch_oids.get (
getattr (val, 'direct_reference', None), None)
if new_codec_fn <> None:
ctx.push_codec ()
new_codec_fn ()
if trace_seq: print "Encoding", attrname, v
typ.encode (ctx, v)
if new_codec_fn <> None:
ctx.pop_codec ()
# XXX rename all these
def SEQUENCE (spec, base_typ = SEQUENCE_BASE, seq_name = None,
extra_bases = None):
if seq_name == None:
seq_name = mk_seq_class_name ()
bases = [StructBase]
if extra_bases <> None:
bases = extra_bases + bases
klass = new.classobj (seq_name, tuple (bases), {})
seq = base_typ (klass, spec)
klass._allowed_attrib_list = seq.get_attribs ()
seq.klass = klass
return seq
# This is the pre-1994 def'n. Note that post-1994 removes the ANY
# and BITSTRING options
EXTERNAL = SEQUENCE ([('direct_reference', None, OID, 1),
('indirect_reference', None, INTEGER, 1),
('data_value_descriptor', None, ObjectDescriptor, 1),
('encoding', None,
CHOICE([('single-ASN1-type', EXPLICIT(0), ANY),
('octet-aligned', 1, OCTSTRING),
('arbitrary', 2, BITSTRING)]))],
EXTERNAL_class,
seq_name = 'EXTERNAL')
import math
class REAL_class (SEQUENCE_BASE):
tag = (CONS_FLAG, REAL_TAG)
# note clients are allowed to treat equal numbers in different bases as
# different, so keep mantissa/base/exponent
class REAL_val:
_mantissa_bits = 20 # XXX is there no way to auto-determine correct val?
def __repr__ (self):
return 'REAL %f' % (self.get_val ())
def set_val (self, val):
m, e = math.frexp (val)
self.mantissa = int (m * pow (2, self._mantissa_bits))
self.base = 2
self.exponent = e - self._mantissa_bits
return self
def get_val (self):
return self.mantissa * pow (self.base, self.exponent)
REAL = SEQUENCE([('mantissa', None, INTEGER),
('base', None, INTEGER),
('exponent', None, INTEGER)],
REAL_class,
seq_name='REAL',
extra_bases = [REAL_val])
REAL.get_val = lambda self: (self.mantissa * 1.0 / self.base) * pow (self.base, self.exponent)
REAL.__str__ = lambda self: "REAL %f" % (self.get_val (),)
_oid_to_asn1_dict = {}
def register_oid (oid, asn):
tmp = EXPLICIT(0) # b/c ANY is EXPLICIT 0 arm of EXTERNAL CHOICE
tmp.set_typ (asn)
_oid_to_asn1_dict [OidVal (oid)] = tmp
def check_EXTERNAL_ASN (so_far):
if trace_external:
print "in check", so_far, EXTERNAL.klass
print "check 2", so_far.__class__
assert (so_far.__class__ == EXTERNAL.klass) # only called from w/in EXTERNAL
dir_ref = getattr (so_far, 'direct_reference', None)
if dir_ref == None:
return
# in theory, should provide support for indirect_reference
# indicating encoding type, but callers can receive asn1.ANY
# decoded data, reencode it, and then redecode it with a proper
# spec as a workaround. Let me know if you actually use
# indirect_reference.
if trace_external:
print "so_far", so_far, dir_ref
rv = _oid_to_asn1_dict.get (dir_ref, None)
if trace_external:
print rv, _oid_to_asn1_dict
return rv
class SEQUENCE_OF(ELTBASE):
tag = (CONS_FLAG, SEQUENCE_TAG)
known_len = 0
def __init__ (self, typ):
self.typ = typ
def __getitem__ (self, key):
if key == 0:
return self.typ
raise KeyError (key)
def fulfill_promises (self, promises):
if isinstance (self.typ, Promise):
self.typ = self.typ.get_promised (promises)
else:
self.typ.fulfill_promises (promises)
class ConsElt:
def __init__ (self, typ):
self.typ = typ
self.lst = []
def get_cur_def (self, seen_tag):
return self.typ
def handle_val (self, val):
self.lst.append (val)
def finish (self):
return self.lst
def start_cons (self, tag, cur_len, ctx):
return self.ConsElt (self.typ)
def encode_val (self, ctx, val):
for e in val:
self.typ.encode (ctx, e)
class SET_OF(SEQUENCE_OF): # XXX SET_OF needs more implementation
pass
def sgn(val):
if val < 0: return -1
if val == 0: return 0
return 1
class BOOLEAN_class (ELTBASE):
tag = (0, BOOL_TAG)
known_len = 1
def encode_val (self, ctx, val):
ctx.len_write_known (1)
ctx.bytes_write ([val <> 0])
# if val is multiple of 256, Python would treat as true, but
# just writing val would truncate. Thus, write val <> 0
def encode_per (self, ctx, val):
ctx.write_bits_unaligned (val <> 0, 1)
def decode_val (self, ctx,buf):
mylen = len (buf)
if mylen <> 1: ctx.raise_error ("Bogus length for bool " +
repr (mylen))
# "not not" to canonicalize. Really only needed for round-trip
# decode - reencode - redecode testing
return not not buf [0]
BOOLEAN = BOOLEAN_class ()
class NULL_class (ELTBASE):
tag = (0, NULL_TAG)
known_len = 1
def encode_val (self, ctx, val):
ctx.len_write_known (0)
def encode_per (self, ctx, val):
pass
def decode_val (self, ctx, buf):
if len (buf) > 0: ctx.raise_error ("Bad length for NULL" + str (buf))
return None
NULL = NULL_class ()
class ENUM (INTEGER_class):
def __init__ (self, **kw):
self.__dict__.update (kw)
OBJECT_IDENTIFIER = OID # for convenience of compiler
class Promise(ELTBASE):
"""Placeholder for generating recursive data structures.
Replaced by calling fulfill_promises method."""
def __init__ (self, type_name):
self.type_name = type_name
def get_promised (self, promises_dict):
return promises_dict[self.type_name]
def __str__ (self):
return 'Promise: ' + self.type_name
class Tester:
def __init__ (self, print_test):
self.idc1 = IncrementalDecodeCtx (NULL)
self.idc2 = IncrementalDecodeCtx (ANY)
self.print_test = print_test
def test (self, spec, val, assertflag = 1):
# XXX add an optional correct encoding to check against, and cmpfn
buf = encode (spec, val)
if self.print_test:
for byte in buf:
print hex (byte)[2:],
print
self.idc1.asn1_def = spec
self.idc1.feed (buf)
self.idc2.feed (buf)
print self.idc1.get_bytes_inprocess_count ()
print self.idc2.get_bytes_inprocess_count ()
assert (self.idc1.get_bytes_inprocess_count () == 0)
assert (self.idc2.get_bytes_inprocess_count () == 0)
assert (self.idc1.val_count () == 1)
assert (self.idc2.val_count () == 1)
idec = self.idc1.get_first_decoded ()
idec2 = self.idc2.get_first_decoded ()
buf2 = encode (ANY, idec2)
if self.print_test:
for byte in buf2:
print hex (byte)[2:],
print
if self.print_test:
print "Val",repr(val), "idec", repr (idec), "any", idec2
if assertflag:
if buf2 <> buf:
print "buf1, buf2 differ"
assert (idec == val)
def run (self):
int_spec = TYPE (EXPLICIT(3), INTEGER)
string_spec = TYPE (5, GeneralString)
bitstring_spec = TYPE (5, BITSTRING)
octstring_spec = TYPE (5, OCTSTRING)
bool_spec = TYPE(100, BOOLEAN)
self.test (bool_spec, 0)
self.test (bool_spec, 1)
self.test (bool_spec, -1, 0)
self.test (bool_spec, 1024, 0)
self.test (int_spec, 4)
self.test (int_spec, 256)
self.test (int_spec, -128)
self.test (int_spec, -129) # should be 83 02 FF 7F
self.test (int_spec, -1)
self.test (int_spec, 0)
self.test (int_spec, -27066) # should be 83 02 96 46
self.test (string_spec, '')
self.test (string_spec, 'Lemon curry?')
self.test (octstring_spec, '\xFF\x00\x99 Foo')
oid_spec = TYPE (4, OID)
oid = OidVal ([1, 2, 840, 10003, 0, 1])
self.test (oid_spec, oid)
null_spec = TYPE (65536, NULL)
self.test (null_spec, None)
real_spec = TYPE(3,REAL)
real_spec2 = REAL
rval = REAL ()
rval.set_val (4.0)
assert 4.0 == rval.get_val ()
self.test (real_spec, rval)
self.test (real_spec2, rval)
bs_test = BitStringVal (17, 0x1B977L) # 011011100101110111
print "bs_test", bs_test
for i in range (10):
print "bitstring", i, bs_test
self.test (bitstring_spec, bs_test)
bs_test.top_ind = bs_test.top_ind + 1
seq_of_spec = SEQUENCE_OF (int_spec)
self.test (seq_of_spec, [1,44,131072])
seq_of_spec = SEQUENCE_OF (TYPE(1, INTEGER))
self.test (seq_of_spec, [1,44,131072])
seq_of_spec = SEQUENCE_OF (INTEGER)
self.test (seq_of_spec, [1,44,131072])
seq_of_spec2 = TYPE (18, SEQUENCE_OF (TYPE(105,GeneralString)))
self.test (seq_of_spec2, ['db'])
self.test (seq_of_spec2, ['db1', 'db2', 'db3'])
self.test (seq_of_spec2, [])
seq_of3 = SEQUENCE_OF(Promise('s'))
seq_of3.fulfill_promises ({'s': seq_of3})
self.test (seq_of3, [[[],[],[[[[]]]]]])
# stupendously useless without a CHOICE in the SEQUENCE_OF
# to introduce ground terms, but hey.
choice_spec = CHOICE ([('foo', 1, INTEGER),
('bar', None, INTEGER),
('baz', None, string_spec),
('foobar', None, seq_of_spec2)])
self.test (choice_spec, ('foo', 2))
self.test (choice_spec, ('bar', 3))
self.test (choice_spec, ('baz', 'choose wisely'))
self.test (choice_spec, ('foobar', ['choose wisely', 'choose stupidly']))
choice2_spec = CHOICE ([('a', 1, INTEGER),
('b', EXPLICIT(2), Promise('choice2')),
('c', 3, SEQUENCE_OF(Promise('choice2')))])
# EXPLICIT is necessary to avoid CHOICE of CHOICE without tag
# to figure out which arm to take
choice2_spec.fulfill_promises ({'choice2' : choice2_spec})
c2 = ('c', [('a', 4),
('b', ('c', [('a', 5), ('b', ('a', 6))]))])
self.test (choice2_spec, c2)
seq_spec = SEQUENCE (
[('a',5, INTEGER),
('c', 51, INTEGER, 1),
('b',6, INTEGER)])
class Foo (seq_spec.klass):
def __init__ (self, a = 0,b = 0):
StructBase.__init__ (self)
self.a = a
self.b = b
seq_test = Foo (4,5)
self.test (seq_spec, seq_test)
seq_test = Foo (4,5)
seq_test.c = 9
self.test (seq_spec, seq_test)
v = EXTERNAL ()
v.direct_reference = oid
v.data_value_descriptor = "infrequently used field"
v.encoding = ('octet-aligned', 'foo bar')
self.test (EXTERNAL, v)
v.direct_reference = OidVal(SUTRS)
v.encoding = ('single-ASN1-type', 'This is a SUTRS string')
self.test (EXTERNAL, v)
big_spec_test = SEQUENCE ([('a', 5, INTEGER),
('b', 4096, GeneralString)])
sq = big_spec_test ()
sq.a = 1
sq.b = '34' * 8192
self.test (big_spec_test, sq)
sq.b = '35' * (65536 * 2)
self.test (big_spec_test, sq)
try:
sq.c = 'bogus'
except AttributeError, exn:
assert (exn.args == ('c',))
else: assert (0)
bitstringval = BitStringVal (12, 0x16eb)
encoded_val = encode (BITSTRING, bitstringval)
Dubuisson_prim_val = [0x3, 0x3, 0x3, 0xB7, 0x58]
Dubuisson_cons_val = [0x23, 0x80, # see pp. 402-404
0x3, 0x2, 0x0, 0xB7,
0x3, 0x2, 0x3, 0x58,
0x0, 0x0]
if cons_encoding:
Dubuisson_val = Dubuisson_cons_val
else:
Dubuisson_val = Dubuisson_prim_val
print encoded_val, Dubuisson_val
assert (len (encoded_val) == len (Dubuisson_val))
for v1, v2 in zip (encoded_val, Dubuisson_val):
assert (v1 == v2)
self.idc1.asn1_def = BITSTRING
self.idc1.feed (Dubuisson_val)
assert (self.idc1.val_count () == 1)
idec = self.idc1.get_first_decoded ()
print idec
assert (idec.top_ind == 12)
assert (idec.bits == 0x16eb)
SUTRS = [1,2,840,10003,5,101]
def run (print_flag):
t = Tester (print_flag)
global cons_encoding, indef_len_encodings # XXX why is global needed?
register_oid (SUTRS, GeneralString)
for indef_len_encodings in [0,1]:
for cons_encoding in [0,1]:
print "Starting", indef_len_encodings, cons_encoding
t.run ()
print "byte offset", t.idc1.offset, t.idc2.offset
import profile
if __name__ == '__main__':
pwc = PERWriteCtx (aligned = 0)
inner_seq_def = SEQUENCE ([
('d1', 0, BOOLEAN),
('d2', 0, BOOLEAN)])
test_def = SEQUENCE ([
('a', 0, INTEGER_class (None, 0,7)),
('b', 0, BOOLEAN),
('c', 0, INTEGER_class (None, 0,3)),
('d', 0, inner_seq_def)])
test = test_def ()
test.a = 5
test.b = 1
test.c = 1
test.d = inner_seq_def ()
test.d.d1 = 1
test.d.d2 = 1
test_def.encode_per (pwc, test)
print "bit offset", pwc.bit_offset
print map (hex, pwc.get_data ())
if 0:
profile.run ("run (0)")
else:
run (1)