/usr/share/acl2-6.3/books/str/base64.lisp is in acl2-books-source 6.3-5.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 | ; ACL2 String Library
; Copyright (C) 2009-2013 Centaur Technology
;
; Contact:
; Centaur Technology Formal Verification Group
; 7600-C N. Capital of Texas Highway, Suite 300, Austin, TX 78731, USA.
; http://www.centtech.com/
;
; This program is free software; you can redistribute it and/or modify it under
; the terms of the GNU General Public License as published by the Free Software
; Foundation; either version 2 of the License, or (at your option) any later
; version. This program is distributed in the hope that it will be useful but
; WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
; FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
; more details. You should have received a copy of the GNU General Public
; License along with this program; if not, write to the Free Software
; Foundation, Inc., 51 Franklin Street, Suite 500, Boston, MA 02110-1335, USA.
;
; Original author: Jared Davis <jared@centtech.com>
(in-package "STR")
(include-book "cutil/define" :dir :system)
(include-book "natstr")
(local (include-book "centaur/bitops/equal-by-logbitp" :dir :system))
(local (include-book "arithmetic/top-with-meta" :dir :system))
(local (include-book "arithmetic"))
(defsection base64
:parents (str)
:short "Routines for Base 64 string encoding/decoding."
:long "<p>We implement ACL2 functions for Base 64 encoding and decoding as
described in <a href='http://www.ietf.org/rfc/rfc4648.txt'>RFC 4648</a>.</p>
<p>Our functions are quite efficient, given the constraints of ACL2 string
processing. We prove the following inversion theorem, which shows that if
encode some text and then try to decode it, then (1) decoding succeeds and (2)
we get the original text back.</p>
@(thm base64-decode-of-base64-encode)
<p>Of course, this theorem does not say anything about whether we have encoded
or decoded the text \"correctly\" as described in RFC 4648. After all, if we
simply used the identity function as our encoder and decoder, the above theorem
would still hold.</p>
<p>However, to the degree possible, our encoder/decoder are intended to
implement Base64 encoding as described by RFC 4648. We do not implement
variants of base64 encoding such as \"base64 URL encoding\" and \"base64 MIME
encoding.\" Some particular details of our implementation:</p>
<ul>
<li>Per Section 3.1, our encoder does not add line breaks.</li>
<li>Per Section 3.2, our encoder adds appropriate padding characters.</li>
<li>Per Section 3.3, our decoder rejects data with non-alphabet
characters.</li>
<li>Per Section 3.5, our encoder sets the pad bits to zero.</li>
<li>We use the Base64 alphabet described in Table 1. We do not use the \"URL
and Filename safe\" Base64 alphabet.</li>
</ul>
<p>We have not attempted to prove the \"other\" inversion property, i.e., if we
start with some encoded text, decode it, and re-encode the result, then we
should get back our initial, encoded text. This is probably not currently
true. To prove it, we would need to change the decoder to reject inputs where
the pad bits are nonzero. Implementations \"may\" choose to implement this
check according to Section 3.5, and in principle it would be a nice
enhancement.</p>")
(defsection base64-impl
:parents (base64)
:short "Implementation details of @(see base64) encoding/decoding."
:long "<p>These routines should generally not be used directly, and may be
changed in future versions of the library.</p>
<p>Here are some naming conventions used throughout these functions:</p>
<ul>
<li><b>chars</b> refer to actual @(see characters), which typically will be in
the Base64 alphabet, i.e., @('A-Z'), @('a-z'), @('0-9'), @('+'), and @('/').
Of course, when decoding, data might be coming from some external source; it
might contain pad characters @('=') or even arbitrary, invalid characters from
beyond the Base64 alphabet.</li>
<li><b>codes</b> refer to actual @(see char-code)s, with the usual
correspondence to <i>chars</i>.</li>
<li><b>values</b> refer to the interpretation of each Base64 character as a
numeric value. For instance, the value of @('#\A') is 0; the value of @('#\B')
is 1, and so on. In our representation, the values are exactly the 64 natural
numbers from 0-63, and can be recognized with, e.g., @('(unsigned-byte-p 6
val)').</li>
<li><b>bytes</b> refer to ordinary 8-bit bytes, which typically will be part of
the original, un-encoded data.</li>
</ul>")
; ----------------------------------------------------------------------------
;
; SUPPORTING LEMMAS
;
; ----------------------------------------------------------------------------
(define char-code-list ((x character-listp))
(if (atom x)
nil
(cons (char-code (car x))
(char-code-list (cdr x)))))
(local (defsection characterp-of-char
(local (defthm x0
(equal (< (+ c a) (+ c b))
(< a b))))
(local (defthm x1
(equal (< (+ -1 a) b)
(< a (+ 1 b)))
:hints(("Goal"
:in-theory (disable x0)
:use ((:instance x0 (c 1)
(a (+ -1 a))
(b b)))))))
(local (defthm characterp-of-nth
(implies (character-listp x)
(equal (characterp (nth n x))
(< (nfix n) (len x))))))
(defthm characterp-of-char
(equal (characterp (char s n))
(< (nfix n) (len (explode s)))))))
(local (defsection unsigned-byte-p-lemmas
(defthm unsigned-byte-p-6-upper-bound
(implies (unsigned-byte-p 6 x)
(< x 64)))
(defthm unsigned-byte-p-8-upper-bound
(implies (unsigned-byte-p 8 x)
(< x 256)))
(defthm unsigned-byte-p-8-of-char-code
(unsigned-byte-p 8 (char-code x)))))
(local (in-theory (disable unsigned-byte-p char)))
(local (defthm true-listp-when-character-listp
(implies (character-listp x)
(true-listp x))
:rule-classes ((:rewrite) (:compound-recognizer))))
(local (defthm stringp-when-character-listp
(implies (character-listp x)
(equal (stringp x)
nil))))
(local (defthm consp-under-iff-when-true-listp
(implies (true-listp x)
(iff (consp x)
x))
:rule-classes ((:rewrite :backchain-limit-lst 0))))
; ----------------------------------------------------------------------------
;
; Value (0-63) <---> Base 64 Alphabet Character
;
; ----------------------------------------------------------------------------
(defsection *b64-chars-from-vals-array*
:parents (b64-char-from-value)
:short "Array mapping each value to its associated character."
:long "<p>This array is the main lookup table used for encoding. It
corresponds to Table 1 from RFC 4648.</p>
@(def *b64-chars-from-vals-alist*)
@(def *b64-chars-from-vals-array*)"
(defconst *b64-chars-from-vals-alist*
'((0 . #\A)
(1 . #\B)
(2 . #\C)
(3 . #\D)
(4 . #\E)
(5 . #\F)
(6 . #\G)
(7 . #\H)
(8 . #\I)
(9 . #\J)
(10 . #\K)
(11 . #\L)
(12 . #\M)
(13 . #\N)
(14 . #\O)
(15 . #\P)
(16 . #\Q)
(17 . #\R)
(18 . #\S)
(19 . #\T)
(20 . #\U)
(21 . #\V)
(22 . #\W)
(23 . #\X)
(24 . #\Y)
(25 . #\Z)
(26 . #\a)
(27 . #\b)
(28 . #\c)
(29 . #\d)
(30 . #\e)
(31 . #\f)
(32 . #\g)
(33 . #\h)
(34 . #\i)
(35 . #\j)
(36 . #\k)
(37 . #\l)
(38 . #\m)
(39 . #\n)
(40 . #\o)
(41 . #\p)
(42 . #\q)
(43 . #\r)
(44 . #\s)
(45 . #\t)
(46 . #\u)
(47 . #\v)
(48 . #\w)
(49 . #\x)
(50 . #\y)
(51 . #\z)
(52 . #\0)
(53 . #\1)
(54 . #\2)
(55 . #\3)
(56 . #\4)
(57 . #\5)
(58 . #\6)
(59 . #\7)
(60 . #\8)
(61 . #\9)
(62 . #\+)
(63 . #\/)))
(defconst *b64-chars-from-vals-array*
(compress1 '*b64-chars-from-vals-array*
(cons (list :header
:dimensions (list 64)
:maximum-length 65
:default #\0
:name '*b64-chars-from-vals-array*)
*b64-chars-from-vals-alist*))))
(defsection *b64-vals-from-codes-array*
:parents (b64-value-from-code)
:short "Array mapping each character code back to its associated value."
:long "<p>This is the main lookup table used for decoding. It covers every
character code from 0...255. Codes for characters that aren't part of the
Base64 alphabet are mapped to NIL.</p>
@(def *b64-vals-from-codes-array*)"
(defconst *b64-vals-from-codes-array*
(compress1 '*b64-vals-from-codes-array*
(cons (list :header
:dimensions (list 256)
:maximum-length 257
:default nil
:name '*b64-vals-from-codes-array*)
(pairlis$ (char-code-list (strip-cdrs *b64-chars-from-vals-alist*))
(strip-cars *b64-chars-from-vals-alist*))))))
(define b64-char-from-value ((value :type (unsigned-byte 6)))
:returns (char characterp :rule-classes :type-prescription)
:parents (base64-impl)
:short "Look up the Base64 character for a value, e.g., @('0') → @('#\\A')."
:long "<p>This is our lowest level encoding function. It's just an array
lookup.</p>"
:inline t
(the character (aref1 '*b64-chars-from-vals-array*
*b64-chars-from-vals-array*
value))
///
(defthm b64-char-from-value-never-produces-a-pad
(not (equal (b64-char-from-value value) #\=))))
(define b64-value-from-code ((code :type (unsigned-byte 8)))
:returns (value (or (not value)
(natp value))
:rule-classes :type-prescription)
:parents (base64-impl)
:short "Look up the value of a Base64 character code, e.g., @('(char-code
#\\A)') → @('0')."
:long "<p>This is our lowest level decoding function. It's just an array
lookup. Codes for characters that aren't part of the Base64 alphabet are
mapped to NIL.</p>"
:inline t
(aref1 '*b64-vals-from-codes-array*
*b64-vals-from-codes-array*
(lnfix code))
///
(defthm unsigned-byte-p-6-of-b64-value-from-code
(iff (unsigned-byte-p 6 (b64-value-from-code code))
(b64-value-from-code code)))
(defthm b64-value-from-code-of-b64-char-from-value
(implies (unsigned-byte-p 6 value)
(equal (b64-value-from-code (char-code (b64-char-from-value value)))
value))
:hints(("Goal" :in-theory (e/d (b64-char-from-value unsigned-byte-p)
(equal-of-char-code-and-constant))))))
; ----------------------------------------------------------------------------
;
; 3 Bytes (0-255) <---> 4 Values (0-63)
;
; ----------------------------------------------------------------------------
(define b64-vals-from-bytes (b1 b2 b3)
(declare (type (unsigned-byte 8) b1 b2 b3))
:returns (mv (v1 natp :rule-classes :type-prescription)
(v2 natp :rule-classes :type-prescription)
(v3 natp :rule-classes :type-prescription)
(v4 natp :rule-classes :type-prescription))
:parents (base64-impl)
:short "Encode 3 bytes into 4 base-64 characters."
:long "<p>Convert three bytes into four values, basically as follows:</p>
@({
Byte Bit Pattern ---> Values
b1 aaaaaabb aaaaaa v1
b2 bbbbcccc bbbbbb v2
b3 ccdddddd cccccc v3
dddddd v4
})"
:inline t
(b* ((v1 (the (unsigned-byte 6) (ash (lnfix b1) -2))) ;; top 6 bits of b1
(v2h (the (unsigned-byte 2) (logand (lnfix b1) #b11))) ;; bottom 2 bits of b1
(v2l (the (unsigned-byte 4) (ash (lnfix b2) -4))) ;; top 4 bits of b2
(v2 (the (unsigned-byte 6)
(logior (the (unsigned-byte 6)
(ash (the (unsigned-byte 2) v2h) 4))
(the (unsigned-byte 4) v2l))))
(v3h (the (unsigned-byte 4) (logand (lnfix b2) #b1111))) ;; bottom 4 bits of b2
(v3l (the (unsigned-byte 2) (ash (lnfix b3) -6))) ;; top 2 bits of b3
(v3 (the (unsigned-byte 6)
(logior (the (unsigned-byte 6)
(ash (the (unsigned-byte 4) v3h) 2))
(the (unsigned-byte 2) v3l))))
(v4 (the (unsigned-byte 6) (logand (lnfix b3) #b111111)))) ;; bottom 6 bits of b3
(mv v1 v2 v3 v4))
///
(defthm unsigned-byte-p-6-of-b64-vals-from-bytes
(implies (and (force (unsigned-byte-p 8 b1))
(force (unsigned-byte-p 8 b2))
(force (unsigned-byte-p 8 b3)))
(b* (((mv v1 v2 v3 v4) (b64-vals-from-bytes b1 b2 b3)))
(and (unsigned-byte-p 6 v1)
(unsigned-byte-p 6 v2)
(unsigned-byte-p 6 v3)
(unsigned-byte-p 6 v4)))))
;; Some lemmas related to the correctness of padding:
(defthm b64-vals-from-bytes-padding-1
(b* (((mv ?v1 ?v2 ?v3 ?v4) (b64-vals-from-bytes b1 b2 0)))
(equal v4 0)))
(defthm b64-vals-from-bytes-padding-2
(b* (((mv ?v1 ?v2 ?v3 ?v4) (b64-vals-from-bytes b1 0 0)))
(equal v3 0))))
(define b64-bytes-from-vals (v1 v2 v3 v4)
(declare (type (unsigned-byte 6) v1 v2 v3 v4))
:returns (mv (b1 natp :rule-classes :type-prescription)
(b2 natp :rule-classes :type-prescription)
(b3 natp :rule-classes :type-prescription))
:parents (base64-impl)
:short "Decode 4 base-64 values into 3 bytes."
:long "<p>This is just doing the inverse of @(see b64-vals-from-bytes).</p>"
:inline t
(b* ((b1 (the (unsigned-byte 8)
(logior (the (unsigned-byte 8) (ash (lnfix v1) 2))
(the (unsigned-byte 8) (ash (lnfix v2) -4)))))
(b2 (the (unsigned-byte 8)
(logior (the (unsigned-byte 8)
(ash (the (unsigned-byte 8) (logand (lnfix v2) #b1111)) 4))
(the (unsigned-byte 8) (ash (lnfix v3) -2)))))
(b3 (the (unsigned-byte 8)
(logior (the (unsigned-byte 8)
(ash (the (unsigned-byte 8) (logand (lnfix v3) #b11)) 6))
(lnfix v4)))))
(mv b1 b2 b3))
///
(defthm unsigned-byte-p-8-of-b64-decode-4-chars
(implies (and (force (unsigned-byte-p 6 v1))
(force (unsigned-byte-p 6 v2))
(force (unsigned-byte-p 6 v3))
(force (unsigned-byte-p 6 v4)))
(b* (((mv b1 b2 b3) (b64-bytes-from-vals v1 v2 v3 v4)))
(and (unsigned-byte-p 8 b1)
(unsigned-byte-p 8 b2)
(unsigned-byte-p 8 b3)))))
(defthm b64-bytes-from-vals-of-b64-vals-from-bytes
(b* (((mv v1 v2 v3 v4) (b64-vals-from-bytes b1 b2 b3))
((mv x1 x2 x3) (b64-bytes-from-vals v1 v2 v3 v4)))
(implies (and (force (unsigned-byte-p 8 b1))
(force (unsigned-byte-p 8 b2))
(force (unsigned-byte-p 8 b3)))
(and (equal x1 b1)
(equal x2 b2)
(equal x3 b3))))
:hints(("Goal" :in-theory (enable b64-vals-from-bytes))
(acl2::equal-by-logbitp-hammer)))
;; Some corollaries related to the correctness of padding:
(defthm b64-bytes-from-vals-padding-1
(b* (((mv v1 v2 v3 ?v4) (b64-vals-from-bytes b1 b2 0))
((mv x1 x2 ?x3) (b64-bytes-from-vals v1 v2 v3 0)))
(implies (and (force (unsigned-byte-p 8 b1))
(force (unsigned-byte-p 8 b2)))
(and (equal x1 b1)
(equal x2 b2))))
:hints(("Goal"
:in-theory (disable b64-bytes-from-vals-of-b64-vals-from-bytes)
:use ((:instance b64-bytes-from-vals-of-b64-vals-from-bytes
(b3 0))))))
(defthm b64-bytes-from-vals-padding-2
(b* (((mv v1 v2 ?v3 ?v4) (b64-vals-from-bytes b1 0 0))
((mv x1 ?x2 ?x3) (b64-bytes-from-vals v1 v2 0 0)))
(implies (force (unsigned-byte-p 8 b1))
(equal x1 b1)))
:hints(("Goal"
:in-theory (disable b64-bytes-from-vals-of-b64-vals-from-bytes)
:use ((:instance b64-bytes-from-vals-of-b64-vals-from-bytes
(b2 0)
(b3 0)))))))
; ----------------------------------------------------------------------------
;
; Character List Encoding/Decoding
;
; ----------------------------------------------------------------------------
; Encoding is somewhat nicer than decoding because we don't have to worry about
; how to handle extraneous characters, etc.
(define b64-enc3 (c1 c2 c3)
(declare (type character c1 c2 c3))
:returns (mv (e1 characterp :rule-classes :type-prescription)
(e2 characterp :rule-classes :type-prescription)
(e3 characterp :rule-classes :type-prescription)
(e4 characterp :rule-classes :type-prescription))
:parents (base64-impl)
:short "Encode 3 arbitrary characters into 4 base-64 characters."
:long "<p>This is the main function for encoding, which is used for all but
perhaps the last one or two characters.</p>"
(b* ((byte1 (char-code c1))
(byte2 (char-code c2))
(byte3 (char-code c3))
((mv val1 val2 val3 val4)
(b64-vals-from-bytes byte1 byte2 byte3))
(char1 (b64-char-from-value val1))
(char2 (b64-char-from-value val2))
(char3 (b64-char-from-value val3))
(char4 (b64-char-from-value val4)))
(mv char1 char2 char3 char4)))
(define b64-enc2 (c1 c2)
(declare (type character c1 c2))
:returns (mv (e1 characterp :rule-classes :type-prescription)
(e2 characterp :rule-classes :type-prescription)
(e3 characterp :rule-classes :type-prescription))
:parents (base64-impl)
:short "Encode 2 final characters into base-64 characters."
:long "<p>This is only used if we have almost reached the end of the string
and there are exactly two characters left to encode; note that in this case we
also need to insert one explicit pad character (=).</p>"
(b* ((byte1 (char-code c1))
(byte2 (char-code c2))
((mv val1 val2 val3 &) (b64-vals-from-bytes byte1 byte2 0))
(char1 (b64-char-from-value val1))
(char2 (b64-char-from-value val2))
(char3 (b64-char-from-value val3)))
(mv char1 char2 char3)))
(define b64-enc1 (c1)
(declare (type character c1))
:returns (mv (e1 characterp :rule-classes :type-prescription)
(e2 characterp :rule-classes :type-prescription))
:parents (base64-impl)
:short "Encode 1 final character into base-64 characters."
:long "<p>This is only used if we have almost reached the end of the string
and there is exactly one character left to encode; note that in this case we
need to insert two explicit pad characters (=).</p>"
(b* ((byte1 (char-code c1))
((mv val1 val2 & &) (b64-vals-from-bytes byte1 0 0))
(char1 (b64-char-from-value val1))
(char2 (b64-char-from-value val2)))
(mv char1 char2)))
(define b64-encode-last-group ((x character-listp))
:returns (mv (e1 characterp :rule-classes :type-prescription)
(e2 characterp :rule-classes :type-prescription)
(e3 characterp :rule-classes :type-prescription)
(e4 characterp :rule-classes :type-prescription))
:guard (consp x)
:parents (base64-impl)
:short "Encode the last group of (up to three) characters."
(cond ((atom (cdr x))
;; Only one character, need two pads
(b* (((mv c1 c2) (b64-enc1 (first x))))
(mv c1 c2 #\= #\=)))
((atom (cddr x))
;; Only two characters, need one pad
(b* (((mv c1 c2 c3) (b64-enc2 (first x) (second x))))
(mv c1 c2 c3 #\=)))
(t
;; Three characters, no pads
(b64-enc3 (first x) (second x) (third x)))))
(define b64-encode-list-impl ((x character-listp)
(acc))
:returns (acc character-listp :hyp (character-listp acc))
:parents (base64-impl)
:short "Tail-recursive version of @(see base64-encode-list)."
(b* (((when (atom x))
acc)
((when (atom (cdddr x)))
(b* (((mv c1 c2 c3 c4) (b64-encode-last-group x)))
(list* c4 c3 c2 c1 acc)))
((mv c1 c2 c3 c4)
(b64-enc3 (first x) (second x) (third x)))
(acc (list* c4 c3 c2 c1 acc)))
(b64-encode-list-impl (cdddr x) acc)))
(define base64-encode-list ((x character-listp "Character list to encode."))
:returns (x-enc character-listp "Encoded version of @('x').")
:parents (base64)
:short "Base64 encode a character list."
:verify-guards nil
(mbe :logic (b* (((when (atom x))
nil)
((when (atom (cdddr x)))
(b* (((mv c1 c2 c3 c4) (b64-encode-last-group x)))
(list c1 c2 c3 c4)))
((mv c1 c2 c3 c4)
(b64-enc3 (first x) (second x) (third x))))
(append (list c1 c2 c3 c4)
(base64-encode-list (cdddr x))))
:exec (reverse (b64-encode-list-impl x nil)))
///
(defthm b64-encode-list-impl-removal
(equal (b64-encode-list-impl x acc)
(revappend (base64-encode-list x) acc))
:hints(("Goal" :in-theory (enable b64-encode-list-impl))))
(verify-guards base64-encode-list))
(define b64-dec3 (c1 c2 c3 c4)
(declare (type character c1 c2 c3 c4))
:parents (base64-impl)
:short "Decode 3 arbitrary characters from 4 base-64 characters."
:long "<p>This is the main function for decoding, which is used for all but
perhaps the last one or two characters.</p>"
:returns (mv (okp booleanp
"Decoding can fail if we encounter non Base-64 alphabetic
characters in the input."
:rule-classes :type-prescription)
(d1 characterp :rule-classes :type-prescription)
(d2 characterp :rule-classes :type-prescription)
(d3 characterp :rule-classes :type-prescription))
(b* ((code1 (char-code c1))
(code2 (char-code c2))
(code3 (char-code c3))
(code4 (char-code c4))
(val1 (b64-value-from-code code1))
(val2 (b64-value-from-code code2))
(val3 (b64-value-from-code code3))
(val4 (b64-value-from-code code4))
((unless (and val1 val2 val3 val4))
(mv nil #\0 #\0 #\0))
((mv (the (unsigned-byte 8) b1)
(the (unsigned-byte 8) b2)
(the (unsigned-byte 8) b3))
(b64-bytes-from-vals val1 val2 val3 val4))
(char1 (code-char b1))
(char2 (code-char b2))
(char3 (code-char b3)))
(mv t char1 char2 char3))
///
(defthm b64-dec3-of-b64-enc3
(implies (and (characterp c1)
(characterp c2)
(characterp c3))
(b* (((mv e1 e2 e3 e4) (b64-enc3 c1 c2 c3))
((mv okp x1 x2 x3) (b64-dec3 e1 e2 e3 e4)))
(and okp
(equal x1 c1)
(equal x2 c2)
(equal x3 c3))))
:hints(("Goal" :in-theory (enable b64-enc3)))))
(define b64-dec2 (c1 c2 c3)
(declare (type character c1 c2 c3))
:parents (base64-impl)
:short "Decode three base-64 characters to recover 2 arbitrary characters."
:long "<p>This is only used to decode the last group of base-64 characters,
when there is exactly one pad.</p>"
:returns (mv (okp booleanp
"Decoding can fail if we encounter non Base-64 alphabetic
characters in the input."
:rule-classes :type-prescription)
(d1 characterp :rule-classes :type-prescription)
(d2 characterp :rule-classes :type-prescription))
(b* ((code1 (char-code c1))
(code2 (char-code c2))
(code3 (char-code c3))
(val1 (b64-value-from-code code1))
(val2 (b64-value-from-code code2))
(val3 (b64-value-from-code code3))
((unless (and val1 val2 val3))
(mv nil #\0 #\0))
((mv (the (unsigned-byte 8) b1)
(the (unsigned-byte 8) b2)
&)
(b64-bytes-from-vals val1 val2 val3 0))
(char1 (code-char b1))
(char2 (code-char b2)))
(mv t char1 char2))
///
(defthm b64-dec2-of-b64-enc2
(implies (and (characterp c1)
(characterp c2))
(b* (((mv e1 e2 e3) (b64-enc2 c1 c2))
((mv okp x1 x2) (b64-dec2 e1 e2 e3)))
(and okp
(equal x1 c1)
(equal x2 c2))))
:hints(("Goal" :in-theory (enable b64-enc2)))))
(define b64-dec1 (c1 c2)
(declare (type character c1 c2))
:parents (base64-impl)
:short "Decode two base-64 characters to recover 1 arbitrary character."
:long "<p>This is only used to decode the last group of base-64 characters,
when there are two pads.</p>"
:returns (mv (okp booleanp
"Decoding can fail if we encounter non Base-64 alphabetic
characters in the input."
:rule-classes :type-prescription)
(d1 characterp :rule-classes :type-prescription))
(b* ((code1 (char-code c1))
(code2 (char-code c2))
(val1 (b64-value-from-code code1))
(val2 (b64-value-from-code code2))
((unless (and val1 val2))
(mv nil #\0))
((mv (the (unsigned-byte 8) b1) & &)
(b64-bytes-from-vals val1 val2 0 0))
(char1 (code-char b1)))
(mv t char1))
///
(defthm b64-dec1-of-b64-enc1
(implies (characterp c1)
(b* (((mv e1 e2) (b64-enc1 c1))
((mv okp x1) (b64-dec1 e1 e2)))
(and okp
(equal x1 c1))))
:hints(("Goal" :in-theory (enable b64-enc1)))))
(define b64-decode-last-group (c1 c2 c3 c4)
(declare (type character c1 c2 c3 c4))
:returns (mv (okp booleanp)
(ans character-listp))
:parents (base64-impl)
:short "Decode the final group of base-64 encoded characters into 1-3 characters."
(cond ((not (eql c4 #\=))
;; There was no pad, so the length was a multiple of three and
;; we really can go ahead and use the main decoder.
(b* (((mv okp char1 char2 char3) (b64-dec3 c1 c2 c3 c4)))
(mv okp (list char1 char2 char3))))
((not (eql c3 #\=))
;; There was exactly one pad, so two characters to decode.
(b* (((mv okp char1 char2) (b64-dec2 c1 c2 c3)))
(mv okp (list char1 char2))))
(t
;; There were two pads, so there should just be one character to decode.
(b* (((mv okp char1) (b64-dec1 c1 c2)))
(mv okp (list char1)))))
///
(local (defthm l1
(not (equal (mv-nth 3 (b64-enc3 c1 c2 c3)) #\=))
:hints(("Goal" :in-theory (enable b64-enc3)))))
(local (defthm l2
(not (equal (mv-nth 2 (b64-enc2 c1 c2)) #\=))
:hints(("Goal" :in-theory (enable b64-enc2)))))
(defthm b64-decode-last-group-of-b64-encode-last-group
(implies (and (character-listp x)
(consp x)
(atom (cdddr x)))
(b* (((mv c1 c2 c3 c4) (b64-encode-last-group x))
((mv okp result) (b64-decode-last-group c1 c2 c3 c4)))
(and okp
(equal result x))))
:hints(("Goal" :in-theory (enable b64-encode-last-group
b64-decode-last-group)))))
(define b64-decode-list-impl ((x character-listp)
(acc))
:returns (mv (okp booleanp :rule-classes :type-prescription)
(acc character-listp :hyp (character-listp acc)))
:parents (base64-impl)
:short "Tail-recursive version of @(see base64-decode-list)."
(b* (((when (atom x))
(mv t acc))
((when (atom (cdddr x)))
;; Less than four characters, so that's not valid at all, just fail.
(mv nil acc))
(c1 (first x))
(c2 (second x))
(c3 (third x))
(c4 (fourth x))
(rest (cddddr x))
((when (atom rest))
;; Reached the very last group. Have to think about padding.
(b* (((mv okp last) (b64-decode-last-group c1 c2 c3 c4)))
(mv okp (revappend last acc))))
;; Else, this is a normal group.
((mv okp x1 x2 x3) (b64-dec3 c1 c2 c3 c4))
((unless okp)
(mv nil acc))
(acc (list* x3 x2 x1 acc)))
(b64-decode-list-impl (cddddr x) acc)))
(define base64-decode-list ((x character-listp "Character list to decode."))
:returns (mv (okp booleanp
"Was decoding successful? It can fail if we encounter non
Base-64 alphabetic characters in the input, or if the
input is not of the proper length (a multiple of 4), or if
there is incorrect padding."
:rule-classes :type-prescription)
(ans character-listp
"On success, the decoded version of @('x'). On failure,
it is some nonsensical character list that should not be
relied on."))
:parents (base64)
:short "Base64 decode a character list."
:verify-guards nil
(mbe :logic
(b* (((when (atom x))
(mv t nil))
((when (atom (cdddr x)))
;; Less than four characters, so that's not valid at all, just fail.
(mv nil nil))
(c1 (first x))
(c2 (second x))
(c3 (third x))
(c4 (fourth x))
(rest (cddddr x))
((when (atom rest))
;; Reached the very last group. Have to think about padding.
(b64-decode-last-group c1 c2 c3 c4))
;; Else, this is a normal group.
((mv okp x1 x2 x3) (b64-dec3 c1 c2 c3 c4))
((unless okp)
(mv nil nil))
((mv rest-ok rest-ans)
(base64-decode-list (cddddr x))))
(mv (and okp rest-ok)
(list* x1 x2 x3 rest-ans)))
:exec
(b* (((mv okp acc) (b64-decode-list-impl x nil)))
(mv okp (reverse acc))))
///
(local (in-theory (enable b64-decode-list-impl)))
(local (defthm l0
(equal (mv-nth 0 (b64-decode-list-impl x acc))
(mv-nth 0 (base64-decode-list x)))))
(local (defthm l1
(equal (mv-nth 1 (b64-decode-list-impl x acc))
(revappend (mv-nth 1 (base64-decode-list x))
acc))))
(defthm b64-decode-list-impl-removal
(equal (b64-decode-list-impl x acc)
(mv (mv-nth 0 (base64-decode-list x))
(revappend (mv-nth 1 (base64-decode-list x))
acc))))
(verify-guards base64-decode-list
;; bleh, stupid hint to know it returns two values
:hints(("Goal" :in-theory (enable b64-decode-last-group))))
(defthm base64-decode-list-of-base64-encode-list
(implies (character-listp x)
(b* ((encoded (base64-encode-list x))
((mv okp decoded) (base64-decode-list encoded)))
(and okp
(equal decoded x))))
:hints(("Goal"
:induct (base64-encode-list x)
:in-theory (enable base64-encode-list
base64-decode-list)))))
; ----------------------------------------------------------------------------
;
; String Encoding/Decoding
;
; ----------------------------------------------------------------------------
(local (defsection nthcdr-lemmas
;; These aren't generally things you'd want, they're sort of
;; specialized to accessing just the first few characters from the
;; list, as the string encoder/decoder need to do...
(defthm cadr-of-nthcdr
(equal (cadr (nthcdr n x))
(nth (+ 1 (nfix n)) x)))
(local (defthm nth-of-inc2-and-list*
(implies (natp n)
(equal (nth (+ 2 n) (list* a b c))
(nth n c)))
:hints(("Goal"
:in-theory (enable nth)
:expand (nth (+ 2 n) (list* a b c))))))
(defthm caddr-of-nthcdr
(equal (caddr (nthcdr n x))
(nth (+ 2 (nfix n)) x)))
(defthm cadddr-of-nthcdr
(equal (cadddr (nthcdr n x))
(nth (+ 3 (nfix n)) x)))
(defthm cddr-nthcdr-under-iff
(implies (and (true-listp x)
(natp n))
(iff (cddr (nthcdr n x))
(< (+ 2 n) (len x)))))
(defthm cdddr-nthcdr-under-iff
(implies (and (true-listp x)
(natp n))
(iff (cdddr (nthcdr n x))
(< (+ 3 n) (len x)))))
(defthm cddddr-nthcdr-under-iff
(implies (and (true-listp x)
(natp n))
(iff (cddddr (nthcdr n x))
(< (+ 4 n) (len x)))))
(defthm cdr-nthcdr-under-iff
(implies (and (true-listp x)
(natp n))
(iff (cdr (nthcdr n x))
(< (+ 1 n) (len x)))))
(defthm cdr-nthcdr-inc2
(implies (natp n)
(equal (cdr (nthcdr (+ 2 n) x))
(cdddr (nthcdr n x))))
:hints(("Goal" :expand ((nthcdr (+ 2 n) x)))))
(defthm cdr-nthcdr-inc3
(implies (natp n)
(equal (cdr (nthcdr (+ 3 n) x))
(cddddr (nthcdr n x))))
:hints(("Goal" :expand ((nthcdr (+ 3 n) x)))))
(defthm nthcdr-of-len
(implies (true-listp x)
(equal (nthcdr (len x) x)
nil)))))
(define b64-encode-last-group-str ((x stringp)
(n natp)
(xl (eql xl (length x))))
:guard (< n xl)
:parents (base64-impl)
:short "String-based version of @(see b64-encode-last-group)."
(declare (type (integer 0 *) n xl)
(type string x))
(b* (((the (integer 0 *) left)
(mbe :logic (nfix (- (nfix xl) (nfix n)))
:exec (- xl n)))
((when (int= left 1))
(b* (((mv c1 c2) (b64-enc1 (char x n))))
(mv c1 c2 #\= #\=)))
((when (int= left 2))
(b* (((mv c1 c2 c3)
(b64-enc2 (char x n) (char x (+ 1 n)))))
(mv c1 c2 c3 #\=))))
(b64-enc3 (char x n)
(char x (+ 1 n))
(char x (+ 2 n))))
///
(defthm b64-encode-last-group-str-correct
(implies (and (force (stringp x))
(force (natp n))
(force (equal xl (length x)))
(force (< n xl)))
(equal (b64-encode-last-group-str x n xl)
(b64-encode-last-group (nthcdr n (explode x)))))
:hints(("Goal"
:in-theory (e/d (b64-encode-last-group char)
(nthcdr nth))
:do-not '(generalize fertilize)
:do-not-induct t))))
(define b64-encode-str-impl ((x stringp)
(n natp)
(xl (eql xl (length x)))
(acc))
:guard (<= n xl)
:parents (base64-impl)
:short "Efficient, string-based version of @(see b64-encode-list-impl)."
:measure (nfix (- (nfix xl) (nfix n)))
(declare (type (integer 0 *) n xl)
(type string x))
(b* (((the (integer 0 *) left)
(mbe :logic (nfix (- (nfix xl) (nfix n)))
:exec (- xl n)))
((when (zp left))
acc)
((when (<= left 3))
(b* (((mv c1 c2 c3 c4) (b64-encode-last-group-str x n xl)))
(list* c4 c3 c2 c1 acc)))
((mv c1 c2 c3 c4)
(b64-enc3 (char x n)
(char x (+ 1 n))
(char x (+ 2 n))))
(acc (list* c4 c3 c2 c1 acc)))
(b64-encode-str-impl x (+ 3 (lnfix n)) xl acc))
///
(local (defthm l0
(implies (and (stringp x)
(natp n)
(equal xl (length x))
(<= n xl))
(equal (b64-encode-str-impl x n xl acc)
(b64-encode-list-impl (nthcdr n (explode x)) acc)))
:hints(("Goal"
:induct (b64-encode-str-impl x n xl acc)
:in-theory (e/d (b64-encode-list-impl
char)
(b64-encode-list-impl-removal))
:expand ((b64-encode-str-impl x n xl acc)
(b64-encode-list-impl (nthcdr n (explode x)) acc))
:do-not '(generalize fertilize)
:do-not-induct t))))
(defthm b64-encode-str-impl-removal
(implies (and (stringp x)
(natp n)
(equal xl (length x))
(<= n xl))
(equal (b64-encode-str-impl x n xl acc)
(revappend (base64-encode-list (nthcdr n (explode x)))
acc)))
:hints(("Goal" :in-theory (disable b64-encode-str-impl)))))
(define base64-encode ((x stringp "String to be encoded."))
:returns (encoded stringp :rule-classes :type-prescription
"Encoded version of @('x').")
:parents (base64)
:short "Base64 encode a string."
(declare (type string x))
(mbe :logic (implode (base64-encode-list (explode x)))
:exec (rchars-to-string (b64-encode-str-impl x 0 (length x) nil))))
(define base64-revappend-encode
((x stringp "String to be encoded.")
(acc "Accumulator for encoded characters (in reverse order)."))
:enabled t
:parents (base64)
:short "Efficient @('(revappend-chars (base64-encode x) acc)')."
:long "<p>We leave this enabled; it would be odd to reason about it.</p>"
:prepwork ((local (in-theory (enable base64-encode revappend-chars))))
(declare (type string x))
(mbe :logic (revappend-chars (base64-encode x) acc)
:exec (b64-encode-str-impl x 0 (length x) acc)))
(define b64-decode-str-impl ((x stringp)
(n natp)
(xl (equal xl (length x)))
(acc))
:guard (<= n xl)
:measure (nfix (- (nfix xl) (nfix n)))
:returns (mv (okp booleanp :rule-classes :type-prescription)
(acc character-listp :hyp (character-listp acc)))
:parents (base64-impl)
:short "Efficient, string-based version of @(see b64-decode-list-impl)."
(declare (type (integer 0 *) n xl)
(type string x))
(b* (((the (integer 0 *) left)
(mbe :logic (nfix (- (nfix xl) (nfix n)))
:exec (- xl n)))
((when (zp left))
(mv t acc))
((when (< left 4))
;; Less than four characters, so that's not valid at all, just fail.
(mv nil acc))
(c1 (char x n))
(c2 (char x (+ 1 n)))
(c3 (char x (+ 2 n)))
(c4 (char x (+ 3 n)))
((when (int= left 4))
;; Reached the very last group. Have to think about padding.
(b* (((mv okp last) (b64-decode-last-group c1 c2 c3 c4)))
(mv okp (revappend last acc))))
;; Else, this is a normal group.
((mv okp x1 x2 x3) (b64-dec3 c1 c2 c3 c4))
((unless okp)
(mv nil acc))
(acc (list* x3 x2 x1 acc)))
(b64-decode-str-impl x (+ 4 (lnfix n)) xl acc))
///
(local (defthm l0
(implies (and (stringp x)
(natp n)
(equal xl (length x))
(<= n xl))
(equal (b64-decode-str-impl x n xl acc)
(b64-decode-list-impl (nthcdr n (explode x)) acc)))
:hints(("Goal"
:induct (b64-decode-str-impl x n xl acc)
:in-theory (e/d (b64-decode-list-impl char)
(b64-decode-list-impl-removal))
:expand ((b64-decode-str-impl x n xl acc)
(b64-decode-list-impl (nthcdr n (explode x)) acc))
:do-not '(generalize fertilize)
:do-not-induct t))))
(defthm b64-decode-str-impl-removal
(implies (and (stringp x)
(natp n)
(equal xl (length x))
(<= n xl))
(equal (b64-decode-str-impl x n xl acc)
(let ((chars (nthcdr n (explode x))))
(mv (mv-nth 0 (base64-decode-list chars))
(revappend (mv-nth 1 (base64-decode-list chars))
acc)))))
:hints(("Goal" :in-theory (disable b64-decode-str-impl)))))
(define base64-decode
((x stringp "String to be decoded."))
:returns (mv (okp booleanp
"Was decoding successful? It can fail if we encounter non
Base-64 alphabetic characters in the input, or if the
input is not of the proper length (a multiple of 4), or if
there is incorrect padding."
:rule-classes :type-prescription)
(ans stringp
"On success, the decoded version of @('x'). On failure,
it is some nonsensical string that should not be relied
on."
:rule-classes :type-prescription))
:parents (base64)
:short "Base64 decode a string."
(declare (type string x))
(mbe :logic
(b* (((mv okp chars)
(base64-decode-list (explode x))))
(mv okp (implode chars)))
:exec
(b* (((mv okp rchars)
(b64-decode-str-impl x 0 (length x) nil)))
(mv okp (rchars-to-string rchars))))
///
(defthm base64-decode-of-base64-encode
(equal (base64-decode (base64-encode x))
(mv t (if (stringp x)
x
"")))
:hints(("Goal" :in-theory (enable base64-encode
base64-decode)))))
(define base64-revappend-decode
((x stringp "String to be decoded.")
(acc "Accumulator for decoded characters (in reverse order)."))
:returns (mv (okp "Was decoding successful?")
(acc))
:enabled t
:parents (base64)
:short "Efficiently revappend the characters from @(see base64-decode) onto
an accumulator."
:long "<p>We leave this enabled; it would be odd to reason about it.</p>"
:prepwork ((local (in-theory (enable base64-decode revappend-chars))))
:guard-debug t
(declare (type string x))
(mbe :logic
(b* (((mv okp str) (base64-decode x)))
(mv okp (revappend-chars str acc)))
:exec
(b64-decode-str-impl x 0 (length x) acc)))
;; Test vectors from RFC 4648, Section 10.
(local
(progn
(assert! (equal (base64-encode "") ""))
(assert! (equal (base64-encode "f") "Zg=="))
(assert! (equal (base64-encode "fo") "Zm8="))
(assert! (equal (base64-encode "foo") "Zm9v"))
(assert! (equal (base64-encode "foob") "Zm9vYg=="))
(assert! (equal (base64-encode "fooba") "Zm9vYmE="))
(assert! (equal (base64-encode "foobar") "Zm9vYmFy"))
(define base64-decode-easy ((x stringp))
(b* (((mv ok orig) (base64-decode x))
((unless ok)
(cutil::raise "Whoops")
""))
orig))
(assert! (equal "" (base64-decode-easy "")))
(assert! (equal "f" (base64-decode-easy "Zg==")))
(assert! (equal "fo" (base64-decode-easy "Zm8=")))
(assert! (equal "foo" (base64-decode-easy "Zm9v")))
(assert! (equal "foob" (base64-decode-easy "Zm9vYg==")))
(assert! (equal "fooba" (base64-decode-easy "Zm9vYmE=")))
(assert! (equal "foobar" (base64-decode-easy "Zm9vYmFy")))))
|