Files
md5/md5.lisp
Pierre R. Mai 576ae1de32 Actually this release was the first public release. It switches over to
using kernel:32bit-logical-* instead of the silly signed-byte acrobatics
that were previously needed to get the various logical and ash operations
optimized.  Also added rudimentary file-comment.
2012-10-14 15:07:41 +02:00

411 lines
15 KiB
Common Lisp

;;;; This code implements MD5 checksums as defined in RFC 1321
;;;; It was written by Pierre R. Mai and placed into the public domain.
(defpackage :MD5 (:use :CL)
(:export
;; Low-Level types and functions
#:md5-regs #:initial-md5-regs #:md5regs-checksum
#:update-md5-block #:fill-block #:fill-block-ub8 #:fill-block-char
;; Mid-Level types and functions
#:md5-state #:md5-state-p #:make-md5-state
#:update-md5-state #:finalize-md5-state
;; High-Level functions on streams/files
#:md5sum-stream #:md5sum-file))
(in-package :MD5)
(eval-when (:compile-toplevel)
(defparameter *old-expansion-limit* ext:*inline-expansion-limit*)
(setq ext:*inline-expansion-limit* (max ext:*inline-expansion-limit* 1000)))
;;; Section 3.4: Auxilliary functions
(deftype ub32 () `(unsigned-byte 32))
(declaim (inline f g h i)
(ftype (function (ub32 ub32 ub32) ub32) f g h i))
(defun f (x y z)
(declare (type ub32 x y z)
(optimize (speed 3) (safety 0) (space 0) (debug 0)))
(kernel:32bit-logical-or (kernel:32bit-logical-and x y)
(kernel:32bit-logical-andc1 x z)))
(defun g (x y z)
(declare (type ub32 x y z)
(optimize (speed 3) (safety 0) (space 0) (debug 0)))
(kernel:32bit-logical-or (kernel:32bit-logical-and x z)
(kernel:32bit-logical-andc2 y z)))
(defun h (x y z)
(declare (type ub32 x y z)
(optimize (speed 3) (safety 0) (space 0) (debug 0)))
(kernel:32bit-logical-xor x (kernel:32bit-logical-xor y z)))
(defun i (x y z)
(declare (type ub32 x y z)
(optimize (speed 3) (safety 0) (space 0) (debug 0)))
(kernel:32bit-logical-xor y (kernel:32bit-logical-orc2 x z)))
(declaim (inline mod32+ rol32)
(ftype (function (ub32 ub32) ub32) mod32+))
(defun mod32+ (a b)
(declare (type ub32 a b) (optimize (speed 3) (safety 0) (space 0) (debug 0)))
(ext:truly-the ub32 (+ a b)))
(declaim (ftype (function (ub32 (unsigned-byte 5)) ub32) rol32))
(defun rol32 (a s)
(declare (type ub32 a) (type (unsigned-byte 5) s)
(optimize (speed 3) (safety 0) (space 0) (debug 0)))
(kernel:32bit-logical-or (kernel:shift-towards-end a s)
(ash a (- s 32))))
(eval-when (:compile-toplevel :load-toplevel :execute)
(defparameter *t* (make-array 64 :element-type 'ub32
:initial-contents
(loop for i from 1 to 64
collect
(truncate
(* 4294967296
(abs (sin (float i 0.0d0)))))))))
(defmacro with-md5-round ((op block) &rest clauses)
(loop for (a b c d k s i) in clauses
collect
`(setq ,a (mod32+ ,b (rol32 (mod32+ (mod32+ ,a (,op ,b ,c ,d))
(mod32+ (aref ,block ,k)
,(aref *t* (1- i))))
,s)))
into result
finally
(return `(progn ,@result))))
;; Block-level operations
(deftype md5-regs () `(simple-array (unsigned-byte 32) (4)))
(defmacro md5-regs-a (regs)
`(aref ,regs 0))
(defmacro md5-regs-b (regs)
`(aref ,regs 1))
(defmacro md5-regs-c (regs)
`(aref ,regs 2))
(defmacro md5-regs-d (regs)
`(aref ,regs 3))
(defconstant +md5-magic-a+ #x67452301)
(defconstant +md5-magic-b+ #xefcdab89)
(defconstant +md5-magic-c+ #x98badcfe)
(defconstant +md5-magic-d+ #x10325476)
(declaim (inline initial-md5-regs))
(defun initial-md5-regs ()
(declare (optimize (speed 3) (safety 0) (space 0) (debug 0)))
(let ((regs (make-array 4 :element-type '(unsigned-byte 32))))
(declare (type md5-regs regs))
(setf (md5-regs-a regs) +md5-magic-a+
(md5-regs-b regs) +md5-magic-b+
(md5-regs-c regs) +md5-magic-c+
(md5-regs-d regs) +md5-magic-d+)
regs))
(defun update-md5-block (regs block)
(declare (type md5-regs regs)
(type (simple-array ub32 (16)) block)
(optimize (speed 3) (safety 0) (space 0) (debug 0)))
(let ((a (md5-regs-a regs)) (b (md5-regs-b regs))
(c (md5-regs-c regs)) (d (md5-regs-d regs)))
(declare (type ub32 a b c d))
;; Round 1
(with-md5-round (f block)
(A B C D 0 7 1)(D A B C 1 12 2)(C D A B 2 17 3)(B C D A 3 22 4)
(A B C D 4 7 5)(D A B C 5 12 6)(C D A B 6 17 7)(B C D A 7 22 8)
(A B C D 8 7 9)(D A B C 9 12 10)(C D A B 10 17 11)(B C D A 11 22 12)
(A B C D 12 7 13)(D A B C 13 12 14)(C D A B 14 17 15)(B C D A 15 22 16))
;; Round 2
(with-md5-round (g block)
(A B C D 1 5 17)(D A B C 6 9 18)(C D A B 11 14 19)(B C D A 0 20 20)
(A B C D 5 5 21)(D A B C 10 9 22)(C D A B 15 14 23)(B C D A 4 20 24)
(A B C D 9 5 25)(D A B C 14 9 26)(C D A B 3 14 27)(B C D A 8 20 28)
(A B C D 13 5 29)(D A B C 2 9 30)(C D A B 7 14 31)(B C D A 12 20 32))
;; Round 3
(with-md5-round (h block)
(A B C D 5 4 33)(D A B C 8 11 34)(C D A B 11 16 35)(B C D A 14 23 36)
(A B C D 1 4 37)(D A B C 4 11 38)(C D A B 7 16 39)(B C D A 10 23 40)
(A B C D 13 4 41)(D A B C 0 11 42)(C D A B 3 16 43)(B C D A 6 23 44)
(A B C D 9 4 45)(D A B C 12 11 46)(C D A B 15 16 47)(B C D A 2 23 48))
;; Round 4
(with-md5-round (i block)
(A B C D 0 6 49)(D A B C 7 10 50)(C D A B 14 15 51)(B C D A 5 21 52)
(A B C D 12 6 53)(D A B C 3 10 54)(C D A B 10 15 55)(B C D A 1 21 56)
(A B C D 8 6 57)(D A B C 15 10 58)(C D A B 6 15 59)(B C D A 13 21 60)
(A B C D 4 6 61)(D A B C 11 10 62)(C D A B 2 15 63)(B C D A 9 21 64))
;; Update and return
(setf (md5-regs-a regs) (mod32+ (md5-regs-a regs) a)
(md5-regs-b regs) (mod32+ (md5-regs-b regs) b)
(md5-regs-c regs) (mod32+ (md5-regs-c regs) c)
(md5-regs-d regs) (mod32+ (md5-regs-d regs) d))
regs))
(declaim (inline fill-block fill-block-ub8 fill-block-char))
(defun fill-block (block buffer offset)
(declare (type (integer 0 #.(- most-positive-fixnum 64)) offset)
(type (simple-array ub32 (16)) block)
(type (simple-array * (*)) buffer)
(optimize (speed 3) (safety 0) (space 0) (debug 0)))
#+(and cmu x86)
(kernel:bit-bash-copy
buffer (+ (* vm:vector-data-offset vm:word-bits) (* offset vm:byte-bits))
block (* vm:vector-data-offset vm:word-bits)
(* 64 vm:byte-bits))
#-(and cmu x86)
(etypecase buffer
((simple-array (unsigned-byte 8) (*))
(fill-block-ub8 block buffer offset))
(simple-string
(fill-block-char block buffer offset))))
(defun fill-block-ub8 (block buffer offset)
(declare (type (integer 0 #.(- most-positive-fixnum 64)) offset)
(type (simple-array ub32 (16)) block)
(type (simple-array (unsigned-byte 8) (*)) buffer)
(optimize (speed 3) (safety 0) (space 0) (debug 0)))
#+(and cmu x86)
(kernel:bit-bash-copy
buffer (+ (* vm:vector-data-offset vm:word-bits) (* offset vm:byte-bits))
block (* vm:vector-data-offset vm:word-bits)
(* 64 vm:byte-bits))
#-(and cmu x86)
(loop for i of-type (integer 0 16) from 0
for j of-type (integer 0 #.most-positive-fixnum)
from offset to (+ offset 63) by 4
do
(setf (aref block i)
(ext:truly-the ub32
(logior
(kernel:shift-towards-end
(aref buffer (+ j 3)) 24)
(kernel:shift-towards-end
(aref buffer (+ j 2)) 16)
(kernel:shift-towards-end
(aref buffer (+ j 1)) 8)
(aref buffer j))))))
(defun fill-block-char (block buffer offset)
(declare (type (integer 0 #.(- most-positive-fixnum 64)) offset)
(type (simple-array ub32 (16)) block)
(type simple-string buffer)
(optimize (speed 3) (safety 0) (space 0) (debug 0)))
#+(and cmu x86)
(kernel:bit-bash-copy
buffer (+ (* vm:vector-data-offset vm:word-bits) (* offset vm:byte-bits))
block (* vm:vector-data-offset vm:word-bits)
(* 64 vm:byte-bits))
#-(and cmu x86)
(loop for i of-type (integer 0 16) from 0
for j of-type (integer 0 #.most-positive-fixnum)
from offset to (+ offset 63) by 4
do
(setf (aref block i)
(ext:truly-the ub32
(logior
(kernel:shift-towards-end
(char-code (schar buffer (+ j 3))) 24)
(kernel:shift-towards-end
(char-code (schar buffer (+ j 2))) 16)
(kernel:shift-towards-end
(char-code (schar buffer (+ j 1))) 8)
(char-code (schar buffer j)))))))
(declaim (inline md5regs-checksum))
(defun md5regs-checksum (regs)
(declare (optimize (speed 3) (safety 0) (space 0) (debug 0))
(type md5-regs regs))
(let ((result (make-array 16 :element-type '(unsigned-byte 8))))
(declare (type (simple-array (unsigned-byte 8) (16)) result))
(macrolet ((frob (reg offset)
(let ((var (gensym)))
`(let ((,var ,reg))
(declare (type ub32 ,var))
(setf
(aref result ,offset) (ldb (byte 8 0) ,var)
(aref result ,(+ offset 1)) (ldb (byte 8 8) ,var)
(aref result ,(+ offset 2)) (ldb (byte 8 16) ,var)
(aref result ,(+ offset 3)) (ldb (byte 8 24) ,var))))))
(frob (md5-regs-a regs) 0)
(frob (md5-regs-b regs) 4)
(frob (md5-regs-c regs) 8)
(frob (md5-regs-d regs) 12))
result))
;; Mid-Level Drivers
(defstruct (md5-state
(:constructor make-md5-state ()))
(regs (initial-md5-regs) :type md5-regs :read-only t)
(amount 0 :type (unsigned-byte 29))
(block (make-array 16 :element-type '(unsigned-byte 32)) :read-only t
:type (simple-array (unsigned-byte 32) (16)))
(buffer (make-array 64 :element-type '(unsigned-byte 8)) :read-only t
:type (simple-array (unsigned-byte 8) (64)))
(buffer-index 0 :type (integer 0 63))
(finalized-p nil))
(declaim (inline copy-to-buffer))
(defun copy-to-buffer (from from-offset count buffer buffer-offset)
(declare (optimize (speed 3) (safety 0) (space 0) (debug 0))
(type (unsigned-byte 29) from-offset)
(type (integer 0 63) count buffer-offset)
(type (simple-array * (*)) from)
(type (simple-array (unsigned-byte 8) (64)) buffer))
#+(and cmu x86)
(kernel:bit-bash-copy
from (+ (* vm:vector-data-offset vm:word-bits) (* from-offset vm:byte-bits))
buffer (+ (* vm:vector-data-offset vm:word-bits)
(* buffer-offset vm:byte-bits))
(* count vm:byte-bits))
#-(and cmu x86)
(etypecase from
(simple-string
(loop for buffer-index of-type (integer 0 64) from buffer-offset
for from-index of-type fixnum from from-offset
below (+ from-offset count)
do
(setf (aref buffer buffer-index)
(char-code (schar from from-index)))))
((simple-array (unsigned-byte 8) (*))
(loop for buffer-index of-type (integer 0 64) from buffer-offset
for from-index of-type fixnum from from-offset
below (+ from-offset count)
do
(setf (aref buffer buffer-index) (aref from from-index))))))
(defun update-md5-state (state sequence &key (start 0) (end (length sequence)))
(declare (type md5-state state)
(type (simple-array * (*)) sequence)
(type fixnum start end)
(optimize (speed 3) (space 0) (debug 0)))
(let ((regs (md5-state-regs state))
(block (md5-state-block state))
(buffer (md5-state-buffer state))
(buffer-index (md5-state-buffer-index state))
(length (- end start)))
(declare (type md5-regs regs) (type fixnum length)
(type (integer 0 63) buffer-index)
(type (simple-array (unsigned-byte 32) (16)) block)
(type (simple-array (unsigned-byte 8) (64)) buffer))
;; Handle old rest
(unless (zerop buffer-index)
(let ((amount (min (- 64 buffer-index) length)))
(declare (type (integer 0 63) amount))
(copy-to-buffer sequence start amount buffer buffer-index)
(setq start (the fixnum (+ start amount)))
(when (>= start end)
(setf (md5-state-buffer-index state) (+ buffer-index amount))
(return-from update-md5-state state)))
(fill-block-ub8 block buffer 0)
(update-md5-block regs block))
;; Handle main-part and new-rest
(etypecase sequence
((simple-array (unsigned-byte 8) (*))
(locally
(declare (type (simple-array (unsigned-byte 8) (*)) sequence))
(loop for offset of-type (unsigned-byte 29) from start below end by 64
until (< (- end offset) 64)
do
(fill-block-ub8 block sequence offset)
(update-md5-block regs block)
finally
(let ((amount (- end offset)))
(unless (zerop amount)
(copy-to-buffer sequence offset amount buffer 0))
(setf (md5-state-buffer-index state) amount)))))
(simple-string
(locally
(declare (type simple-string sequence))
(loop for offset of-type (unsigned-byte 29) from start below end by 64
until (< (- end offset) 64)
do
(fill-block-char block sequence offset)
(update-md5-block regs block)
finally
(let ((amount (- end offset)))
(unless (zerop amount)
(copy-to-buffer sequence offset amount buffer 0))
(setf (md5-state-buffer-index state) amount))))))
(setf (md5-state-amount state) (+ (md5-state-amount state) length))
state))
(defun finalize-md5-state (state)
(declare (type md5-state state)
(optimize (speed 3) (space 0) (debug 0)))
(or (md5-state-finalized-p state)
(let ((regs (md5-state-regs state))
(block (md5-state-block state))
(buffer (md5-state-buffer state))
(buffer-index (md5-state-buffer-index state))
(total-length (md5-state-amount state)))
(declare (type md5-regs regs)
(type (unsigned-byte 29) total-length)
(type (integer 0 63) buffer-index)
(type (simple-array ub32 (16)) block)
(type (simple-array (unsigned-byte 8) (*)) buffer))
(setf (aref buffer buffer-index) #x80)
(loop for index of-type (integer 0 64)
from (1+ buffer-index) below 64
do (setf (aref buffer index) #x00))
(fill-block-ub8 block buffer 0)
(when (< buffer-index 56)
(setf (aref block 14) (* total-length 8)))
(update-md5-block regs block)
(when (< 56 buffer-index 64)
(loop for index of-type (integer 0 16) from 0 below 16
do (setf (aref block index) #x00000000))
(setf (aref block 14) (* total-length 8))
(update-md5-block regs block))
(setf (md5-state-finalized-p state)
(md5regs-checksum regs)))))
;; High-Level Drivers
(defconstant +buffer-size+ (* 128 1024))
(deftype buffer-index () `(integer 0 ,+buffer-size+))
(defun md5sum-stream (stream)
(declare (optimize (speed 3) (space 0) (debug 0)))
(let ((state (make-md5-state)))
(declare (type md5-state state))
(cond
((equal (stream-element-type stream) '(unsigned-byte 8))
(let ((buffer (make-array +buffer-size+ :element-type '(unsigned-byte 8))))
(declare (type (simple-array (unsigned-byte 8) (#.md5::+buffer-size+))
buffer))
(loop for bytes of-type buffer-index = (read-sequence buffer stream)
do (update-md5-state state buffer :end bytes)
until (< bytes +buffer-size+)
finally
(return (finalize-md5-state state)))))
((equal (stream-element-type stream) 'character)
(let ((buffer (make-string +buffer-size+)))
(declare (type (simple-string #.md5::+buffer-size+) buffer))
(loop for bytes of-type buffer-index = (read-sequence buffer stream)
do (update-md5-state state buffer :end bytes)
until (< bytes +buffer-size+)
finally
(return (finalize-md5-state state)))))
(t
(error "Unsupported stream element-type ~S for stream ~S."
(stream-element-type stream) stream)))))
(defun md5sum-file (pathname)
(declare (optimize (speed 3) (space 0) (debug 0)))
(with-open-file (stream pathname :element-type '(unsigned-byte 8))
(md5sum-stream stream)))
(eval-when (:compile-toplevel)
(setq ext:*inline-expansion-limit* *old-expansion-limit*))