-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathchars.lisp
847 lines (774 loc) · 35.4 KB
/
chars.lisp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
;;; :FILE mon-systems/chars.lisp
;;; ==============================
;;; ==============================
;;; :NOTE Following are teh SBCL internals notes re the implementation of :SB-UNICODE
;;; :SOURCE (URL `http://www.sbcl.org/sbcl-internals/Character-and-String-Types.html#Character-and-String-Types')
;;
;; The :SB-UNICODE feature implies support for all 1114112 potential characters in
;; the character space defined by the Unicode consortium, with the identity mapping
;; between lisp char-code and Unicode code point. SBCL releases before version
;; 0.8.17, and those without the :SB-UNICODE feature, support only 256 characters,
;; with the identity mapping between char-code and Latin1 (or, equivalently, the
;; first 256 Unicode) code point.
;;
;; In the absence of the :SB-UNICODE feature, the types base-char and character are
;; identical, and encompass the set of all 256 characters supported by the
;; implementation. With the :SB-UNICODE on *features* (the default), however,
;; base-char and character are distinct: character encompasses the set of all
;; 1114112 characters, while base-char represents the set of the first 128
;; characters.
;; The effect of this on string types is that an sbcl configured with :SB-UNICODE
;; has three disjoint string types: (vector nil), base-string and (vector
;; character). In a build without :SB-UNICODE, there are two such disjoint types:
;; (vector nil) and (vector character); base-string is identially equal to (vector
;; character).
;;
;; The SB-KERNEL:CHARACTER-SET-TYPE represents possibly noncontiguous sets of
;; characters as lists of range pairs: for example, the type standard-char is
;; represented as the type (sb-kernel:character-set '((10 . 10) (32 . 126)))
;;; ==============================
;;
;;; :NOTE :FILE sbcl/src/code/octets.lisp defines the character conversion routines
;;; :SEE comments beginning around: `define-unibyte-mapper'
;; ,----
;; | to-octets conversions
;; |
;; | to latin (including ascii)
;; |
;; | Converting bytes to character codes is easy: just use a 256-element
;; | lookup table that maps each possible byte to its corresponding
;; | character code.
;; |
;; | Converting character codes to bytes is a little harder, since the
;; | codes may be spare (e.g. we use codes 0-127, 3490, and 4598).
;; | {...}
;; `----
;; :INTERNAL
;; `define-unibyte-mapper', `define-latin->string*', `string->latin%',
;; `get-latin-bytes', `define-latin->string*', `define-latin->string',
;; `sb-impl::*default-external-format*', `default-external-format'
;;
;; :PUBLIC
;; `octets-to-string', `string-to-octets', `+unicode-replacement-character+',
;; `use-unicode-replacement-char', `with-standard-replacement-character',
;; `with-default-decoding-replacement',
;;
;; +unicode-replacement-character+ ;; sb-impl::+unicode-replacement-character+
;; with-default-decoding-replacement ;; sb-impl::with-default-decoding-replacement
;; with-standard-replacement-character ;; sb-impl::with-standard-replacement-character
;;
;; (string-to-octets "bubba")
;; ;=> #(98 117 98 98 117)
;; (octets-to-string (make-array 3 :element-type '(unsigned-byte 8)
;; :initial-contents '(32 59 102)))
;; => " ;f"
;; stringstring-coerce-from
;;; ==============================
;;
;; ,----
;; |
;; | 10.2 Reader and Printer
;; |
;; | The `"' reader macro always constructs an object of type `(simple-array
;; | character)', even if all of the characters within the quotation marks
;; | are of type `base-char'. This implies that only strings of type
;; | `(vector character)' will be able to be printed when `*print-readably*'
;; | is true: attempting to print strings of other types will cause an error
;; | of type `print-not-readable'.
;; |
;; `---- :SEE info node `(sbcl-internals)Reader and Printer'
;;
;;; ==============================
(in-package #:mon)
;; *package*
(declaim (inline whitespace-char-p))
(defun whitespace-char-p (maybe-wsp-char)
(declare (optimize (speed 3)))
(when (characterp maybe-wsp-char)
(the boolean
(typep maybe-wsp-char 'whitespace-char))))
;; :WAS
;; (or (member maybe-wsp-char *whitespace-chars* :test #'char=)
;; :NOTE #\space is considered to be `graphic-char-p' and is in fact its lower bounds.
;; (not (graphic-char-p maybe-wsp-char))))
(declaim (inline char-not-whitespace-char-p))
(defun char-not-whitespace-char-p (maybe-not-whitespace-char)
(declare (optimize (speed 3)))
(the boolean
(typep maybe-not-whitespace-char 'char-not-whitespace-char)))
(declaim (inline hexadecimal-char-p))
(defun hexadecimal-char-p (maybe-hex-char)
(declare (optimize (speed 3)))
(the boolean
(typep maybe-hex-char 'hexadecimal-char)))
(defun char-code-integer-to-string (char-code-int &key stream) ;;&optional stream)
(declare (type char-code-integer char-code-int)
(stream-or-boolean stream))
#-sbcl (assert (char-code-integer-p char-code-int))
;; :NOTE Using `mon:open-stream-output-stream-p' instead:
(and stream (open-stream-output-stream-p stream :allow-booleans t :w-error t))
(or
(and stream (write-string (string (the character (code-char char-code-int))) stream))
(string (the character (code-char char-code-int)))))
;; string-split-on-chars, char-list-to-string
(defun char-to-string (char &key stream (allow-integers t))
(declare (type (or char-code-integer character) char)
(boolean allow-integers)
(stream-or-boolean stream))
;; :WAS (and stream (or (and (streamp stream) (open-stream-p stream)) (error 'stream-error)))
;; :NOTE Use `mon:open-stream-output-stream-p' instead:
(and stream (open-stream-output-stream-p stream :allow-booleans t :w-error t))
(etypecase char
(char-code-integer (if allow-integers
(char-code-integer-to-string char :stream stream)
(error 'type-error :datum char :expected-type 'character)))
;; simple-type-error (where-is "simple-type-error")
(character (or (and stream (write-string (string char) stream))
(string char)))))
(declaim (inline %char-code-integer-to-char-if))
(defun %char-code-integer-to-char-if (char-or-char-code-integer)
(declare (char-code-integer char-or-char-code-integer)
(optimize (speed 3)))
(code-char char-or-char-code-integer))
(defun char-code-integer-to-char (char-or-char-code-integer &key w-no-error)
(declare (inline
char-or-char-code-integer-p
%char-code-integer-to-char-if)
(boolean w-no-error)
(optimize (speed 3)))
(typecase char-or-char-code-integer
(character char-or-char-code-integer)
(char-code-integer (%char-code-integer-to-char-if char-or-char-code-integer))
(t (if w-no-error
char-or-char-code-integer
(simple-error-mon
:w-sym 'char-code-integer-to-char
:w-type 'function
:w-spec "arg CHAR-OR-CHAR-CODE-INTEGER neither `cl:characterp' ~
nor `mon:char-code-integer-p'"
:w-got char-or-char-code-integer
:w-type-of t
:signal-or-only nil)))))
(declaim (inline %char-coerce-string-of-length-1-if))
(defun %char-coerce-string-of-length-1-if (string-of-length-1)
(declare (string-of-length-1 string-of-length-1)
(inline char-code-integer-p)
(optimize (speed 3)))
;; :NOTE In neither case clause should schar/char 0 ever be a non
;; char-code-integer happen and will likely never happen with objects of type
;; simple-string-of-length-1 however, it is conceivable for it to occure with
;; objects of type string-of-length-1.
(etypecase string-of-length-1
(simple-string-of-length-1
(let ((get-char (schar (the simple-string-of-length-1 string-of-length-1) 0)))
(or
(and (char-code-integer-p (char-code get-char)) get-char)
(error "The CL:SCHAR at index 0 not of type `mon:char-code-integer'~% ~
got: ~S~%" string-of-length-1))))
(string-of-length-1
(let ((get-char (char (the string-of-length-1 string-of-length-1) 0)))
(or
(and (char-code-integer-p (char-code get-char)) get-char)
(error "The CL:CHAR at index 0 not of type `mon:char-code-integer'~% ~
got: ~S~%" string-of-length-1))))))
(defun char-or-char-code-integer-or-string-1-ensure-char (char-or-char-code-integer-or-string-1)
(declare (char-or-char-code-integer-or-string-1 char-or-char-code-integer-or-string-1)
(inline %char-code-integer-to-char-if
%char-coerce-string-of-length-1-if)
(optimize (speed 3)))
;; #-sbcl (assert (char-or-char-code-integer-or-string-1
(etypecase char-or-char-code-integer-or-string-1
(character char-or-char-code-integer-or-string-1)
(char-code-integer (%char-code-integer-to-char-if char-or-char-code-integer-or-string-1))
(simple-string-of-length-1
(%char-coerce-string-of-length-1-if
(the simple-string-of-length-1 char-or-char-code-integer-or-string-1)))
(string-of-length-1
(%char-coerce-string-of-length-1-if
(the string-of-length-1 char-or-char-code-integer-or-string-1)))))
(defun char-numeric= (char-x char-y)
(declare ;((or character char-code-integer) char-x char-y)
(char-or-char-code-integer char-x char-y)
;; inlining %char-numeric= is bad don't do it!
(optimize (speed 3) (safety 1)))
(values-list
(etypecase char-x
(character
(etypecase char-y
(character (or (and (zerop (%char-numeric= char-x
char-y))
(list t char-x))
(list nil char-x char-y)))
(char-code-integer (or (and (zerop (%char-numeric= char-x (code-char char-y)))
(list t char-x))
(list nil char-x (code-char char-y))))))
(char-code-integer
(etypecase char-y
(char-code-integer (or (and (zerop (logxor char-x char-y))
(list t (code-char char-x)))
(list nil (code-char char-x) (code-char char-y))))
(character (or (and (zerop (logxor char-x (char-code char-y)))
(list t char-y))
(list nil (code-char char-x) char-y))))))))
(defun char-list-to-string (char-list &optional stream)
(declare (type list char-list)
(stream-or-boolean stream))
;; :WAS (and stream (or (and (streamp stream) (open-stream-p stream)) (error 'stream-error)))
;; :NOTE Using `mon:open-stream-output-stream-p' instead:
(and stream (open-stream-output-stream-p stream :allow-booleans t :w-error t))
(when
(etypecase char-list
(each-a-character-or-char-code-integer t)
(each-a-character t)
(each-a-char-code-integer t))
(with-open-stream (msos (make-string-output-stream))
(loop
:for chars :in char-list
:do (char-to-string chars :allow-integers t :stream msos)
:finally (return (if stream
(values (write-string (get-output-stream-string msos) stream)
(length char-list))
(get-output-stream-string msos)
))))))
(defun char-position (w-char in-string &optional (start-idx 0) (max-idx (length in-string)))
(declare (type string in-string)
(type character w-char))
(do* ((i start-idx (1+ i)))
((= i max-idx) nil)
(when (char= w-char (char in-string i)) (return i))))
(defun chars-not-in-string-p (char-bag string &key (test #'char=))
(declare (type string string)
(type proper-list-not-null char-bag))
(loop
:named bail-if
:for fnd-char :across string
:for pos :below (length string)
:do (loop
:for chk-chars :in char-bag
:when (funcall test chk-chars fnd-char)
:do (return-from bail-if (values nil pos)))
:finally (return-from bail-if t)))
;;
(declaim (inline max-char))
(defun max-char ()
(declare (optimize (speed 3)))
char-code-limit)
(declaim (inline ascii-char-p))
(defun ascii-char-p (c)
(declare (optimize (speed 3)))
(when (characterp c)
(the boolean
(<= (char-code (the character c)) 127))))
(declaim (inline ascii-string-p))
(defun ascii-string-p (string)
;; Allow STRING arg to be anything then filter out everything w/ string-not-null-p
;; (every #'ascii-char-p ())
;; (every #'ascii-char-p "")
;; (every #'ascii-char-p "í")
(declare (inline string-not-null-p ascii-char-p)
(optimize (speed 3)))
(when (string-not-null-p string)
(locally
(declare (string-not-null string))
(etypecase string
(simple-string (the boolean (every #'ascii-char-p (the simple-string string))))
(string (the boolean (every #'ascii-char-p (the string string))))))))
(declaim (inline ascii-simple-string-p))
(defun ascii-simple-string-p (string)
(declare (inline ascii-string-p)
(optimize (speed 3)))
(the boolean
(typep string 'simple-ascii-string)))
(defun ascii-downcase (char-w-code)
(declare (optimize (speed 3)))
(let ((cwc
(etypecase char-w-code
((unsigned-byte 7) char-w-code)
(standard-char (char-code (the standard-char char-w-code)))
(char-code-integer (return-from ascii-downcase
(values (the char-code-integer char-w-code) nil)))
(character
(return-from ascii-downcase (values (char-code char-w-code) nil))))))
(values-list
(or (and (<= 65 (the char-code-integer cwc) 90)
(list (+ (the (unsigned-byte 7) cwc) 32) t))
(list cwc nil)))))
(defun ascii-equal (char-a char-b)
(declare (inline ascii-char-p)
(optimize (speed 3)))
(when (and (ascii-char-p char-a)
(ascii-char-p char-b))
(the boolean
(eql (ascii-downcase char-a)
(ascii-downcase char-b)))))
;;; :SOURCE chunga-1.1.1/read.lisp :WAS `controlp'
;;; What about an alias for `control-char-p'?
(declaim (inline ascii-control-p))
(defun ascii-control-p (char)
(declare (optimize (speed 3)))
(when (characterp char)
(the boolean
(or (<= 0 (char-code (the character char)) 31)
(= (char-code (the character char)) 127)))))
(declaim (inline latin-1-char-p))
(defun latin-1-char-p (char)
(declare (optimize (speed 3)))
(when (characterp char)
(the boolean
(<= (char-code (the character char)) 255))))
;; (and (notany #'characterp "") (every #'characterp "")) ;=> t
;;
;; ascii-string-p
;; (type-of (coerce "0123456789abcdef" 'simple-base-string)) => (SIMPLE-BASE-STRING 16)
;;
;; (aref (the (SIMPLE-BASE-STRING 16) (coerce "0123456789abcdef" 'simple-base-string)) 3)
;;
;;; :NOTE :SEE :FILE mon-systems/arrays.lisp `string-ascii-to-byte-array'
;;; :SEE :FILE mon-systems/types.lisp `simple-iso-latin-1-string'
(defun latin-1-string-p (string)
(declare (inline string-empty-p
simple-string-empty-p
latin-1-char-p)
(optimize (speed 3)))
(when (stringp string)
(locally
(declare (string string))
(etypecase string
(simple-string
(the boolean
(or (simple-string-empty-p (the simple-string string))
(every #'latin-1-char-p (the simple-string string)))))
(string
(the boolean
(or (string-empty-p string)
(every #'latin-1-char-p string))))))))
(defun latin-1-simple-string-p (string)
(declare (optimize (speed 3)))
(when (stringp string)
(when (simple-string-p (the string string))
(latin-1-string-p (the simple-string string)))))
;; :SOURCE slime-20101207-cvs/swank.lisp :WAS `casify-char'
(defun char-invert-case-maybe (char-to-invert &key (case :preserve))
(declare (type character char-to-invert))
(unless (memq case '(:preserve :upcase :downcase :invert))
(setf case :preserve))
;; :WAS (ecase (readtable-case *readtable*)
(case case
(:preserve char-to-invert)
(:upcase (char-upcase char-to-invert))
(:downcase (char-downcase char-to-invert))
(:invert (if (upper-case-p char-to-invert)
(char-downcase char-to-invert)
(char-upcase char-to-invert)))))
(defun char-for-readtable-case (case-frob-char &optional readtable)
(declare (type character case-frob-char)
((or null readtable) readtable))
(string-invert-case case-frob-char
:case (or
(and readtable
(or
(and (readtablep readtable)
(readtable-case readtable))
(simple-error-mon :w-sym 'match-readtable-case
:w-type 'function
:w-spec "arg READTABLE not `readtablep'"
:w-got readtable
:w-type-of readtable
:signal-or-only nil)))
(readtable-case (or readtable *readtable*)))))
(defun char-ascii-table (&key case)
;; :NOTE Yes, we know there are more elegant ways to do this!
(ecase case
(:lower
(loop
for x from 97 below 123
and y from 1 below 27
collect (cons y (char-code-integer-to-string x))))
(:upper
(loop
for x from 65 below 91
and y from 1 below 27
collect (cons y (char-code-integer-to-string x))))
(:lower-upper
(loop
for lx from 97 below 123
for ux from 65 below 91
and ly from 1 to 27
and uy from 27 to 52
collect (cons uy (char-code-integer-to-string ux)) into rtn
collect (cons ly (char-code-integer-to-string lx)) into gthr
finally (return (append gthr rtn ))))
(:upper-lower
(loop
for ux from 65 below 91
for lx from 97 below 123
and uy from 1 to 27
and ly from 27 to 52
collect (cons uy (char-code-integer-to-string ux)) into rtn
collect (cons ly (char-code-integer-to-string lx)) into gthr
finally (return (append rtn gthr))))))
#+sbcl
(defun char-length (mb-char)
;; :NOTE what about `char-or-char-code-integer'?
(declare
((or character code-point) mb-char)
(optimize (speed 3)))
(sb-impl::char-len-as-utf8
(etypecase mb-char
(code-point mb-char)
(character (char-code mb-char)))))
;; (sb-impl::string->utf8 "►" 0 1 0)
;; => #(226 150 186)
;; (char-length
;;
;; (sb-impl::string->utf8 "abcÿ►◄λ" 0 3 0)
;; (ironclad:ascii-string-to-byte-array "abcÿ")
;; => #(97 98 99 255)
;; (length "abcÿ")
;; #xc3
;; :SOURCE mccme-helpers/packages:file mccme-helpers/parsetype
;; :WAS `escape-char-unicode-octochar'
(defun char-escape-as-unicode-octochar-string (char-to-escape)
(declare (character char-to-escape))
(format nil "\\U~8,'0x" (char-code char-to-escape)))
;; :SOURCE mccme-helpers/packages:file mccme-helpers/parsetype
;; :WAS `escape-unicode-long'
(defun string-escape-as-unicode-octo-chars (string-to-escape)
(declare (type string string-to-escape))
(apply 'concatenate 'string
(map 'list 'char-escape-as-unicode-octochar-string string-to-escape)))
;;; ==============================
;;; :CHARS-DOCUMENTATION
;;; ==============================
(fundoc 'char-numeric=
"Whether CHAR-X and CHAR-Y are numerically equal.~%~@
CHAR-X and CHAR-Y are each either of type `cl:character' or
`mon:char-code-integer', an error is signaled if not.~%~@
Return value is as if by `cl:values'.~%~@
When codepoints of CHAR-X and CHAR-Y are numerically = return value has the form:~%
T, <CHARACTER-X|Y>~%~@
When codepoints of CHAR-X and CHAR-Y are not numerically =, return value has form:~%
T, CHARACTER-X, CHARACTER-Y~%~@
In either case the above syntax <CHARACTER-*> indicates that return value is a
character designator produced as if by `cl:code-char' e.g.:~%~@
\(code-char 9658\)
=> #\BLACK_RIGHT-POINTING_POINTER~%~@
:EXAMPLE~%
\(char-numeric= #\\► 9658\)~%
\(char-numeric= 9658 9658\)~%
\(char-numeric= 9658 #\\►\)~%
\(char-numeric= #\\◄ #\\►\)~%
\(char-numeric= 9657 #\\►\)~%
\(char-numeric= 9657 9658\)~%
\(char-numeric= 9657 9658\)~%~@
:SEE-ALSO `<XREF>'.~%▶▶▶")
(fundoc 'ascii-downcase
"Return as if by `cl:values' the downcased `cl:char-code' of ASCII CHAR-W-CODE.~%~@
CHAR-W-CODE is a character or integer of type `mon:char-code-integer'.~%~@
Second value is t when CHAR-W-CODE was returned as a downcased value.~%~@
:EXAMPLE~%
\(ascii-downcase 88\)~%
\(ascii-downcase #\\X\)~%
\(ascii-downcase #\\►\)~%
\(ascii-downcase 233\)~%~@
:SEE-ALSO `mon:*whitespace-chars*', `mon:whitespace-char-p',
`mon:ascii-downcase', `mon:ascii-downcase', `mon:ascii-char-p',
`mon:ascii-string-p'.~%▶▶▶")
(fundoc 'ascii-equal
"Return non-nil when CHAR-A and CHAR-B are `cl:eql' ASCII chars.~%~@
To account for case wrt the lisp reader comparison is made by first downcasing both
CHAR-A and CHAR-B before testing for `cl:eql'.~%~@
:EXAMPLE~%
\(ascii-equal #\\a #\\a\)
\(ascii-equal #\\A #\\A\)
\(ascii-equal #\\A #\\a\)
\(ascii-equal #\\a #\\A\)~%~@
:SEE-ALSO :SEE-ALSO `mon:whitespace-char-p' `mon:ascii-string-p',
`mon:ascii-char-p', `mon:ascii-downcase', `mon:ascii-equal',
`mon:ascii-control-p', `mon:latin-1-char-p', `mon:latin-1-string-p'.~%▶▶▶")
(fundoc 'ascii-string-p
"Whether every character in the simple-string STRING is `mon:ascii-char-p'.~%~@
:EXAMPLE~%
\(ascii-string-p \"aeEiou\"\)
\(ascii-string-p \"àéÉíóü\"\)~%~@
:SEE info node `(ansicl)Character Syntax'~%~@
:SEE-ALSO `mon:whitespace-char-p' `mon:ascii-string-p', `mon:ascii-char-p',
`mon:ascii-downcase', `mon:ascii-equal', `mon:ascii-control-p',
`mon:latin-1-char-p', `mon:latin-1-string-p'.~%▶▶▶")
(fundoc 'ascii-char-p
"Whether character C is `cl:characterp' with char-codeless than or equal to 127.~%~@
:EXAMPLE~%
\(ascii-char-p \"E\"\)~%
\(ascii-char-p \"É\"\)~%~@
:SEE info node `(ansicl)Character Syntax'~%~@
:SEE-ALSO `mon:whitespace-char-p' `mon:ascii-string-p', `mon:ascii-char-p',
`mon:ascii-downcase', `mon:ascii-equal', `mon:ascii-control-p',
`mon:latin-1-char-p', `mon:latin-1-string-p'.~%▶▶▶")
(fundoc 'ascii-control-p
"Whether CHAR is characterp and a control character according to RFC 2616.~%~@
This is the range of ASCII characters in the range 0-31 and 127.~%~@
:EXAMPLE~%
\(ascii-control-p #\\DC1\)~%
\(ascii-control-p #\\US\)~%
\(ascii-control-p #\\NEWLINE\)~%
\(ascii-control-p #\\DEL\)~%
\(ascii-control-p #\\SPACE\)~%~@
:SEE info node `(ansicl)Standard Characters'~%~@
:SEE-ALSO `mon:whitespace-char-p', `mon:char-length', `mon:ascii-char-p',
`mon:ascii-string-p', `mon:ascii-equal', `mon:ascii-downcase',
`mon:*whitespace-chars*', `mon:latin-1-char-p', `mon:latin-1-string-p'.~%▶▶▶")
(fundoc 'latin-1-char-p
"Whether character C is `cl:characterp' with char-codeless than or equal to 255.~%~@
:EXAMPLE~%
\(latin-1-char-p \"É\"\)~%
\(latin-1-char-p \"E\"\)~%
\(ascii-char-p \"E\"\)~%
\(ascii-char-p \"É\"\)~%~@
:SEE info node `(ansicl)Character Syntax'~%~@
:SEE-ALSO `mon:whitespace-char-p' `mon:ascii-string-p', `mon:ascii-char-p',
`mon:ascii-downcase', `mon:ascii-equal', `mon:ascii-control-p',
`mon:latin-1-char-p', `mon:latin-1-string-p'.~%▶▶▶")
(fundoc 'latin-1-string-p
"Whether every character in the simple-string STRING is `mon:latin-1-char-p'.~%~@
:EXAMPLE~%
\(latin-1-string-p \"àéÉíóü\"\)~%
\(ascii-string-p \"àéÉíóü\"\)~%~@
:SEE-ALSO `mon:whitespace-char-p' `mon:ascii-string-p', `mon:ascii-char-p',
`mon:ascii-downcase', `mon:ascii-equal', `mon:ascii-control-p'.~%▶▶▶")
(fundoc 'whitespace-char-p
"Return non-nil when char is a member of `*whitespace-chars*'~%~@
:EXAMPLE~%
\(whitespace-char-p #\\a\)~%
\(whitespace-char-p #\\tab\)~%~@
:SEE info node `(ansicl)Character Syntax'~%~@
:SEE-ALSO
`cl:base-char-p', `cl:char-code-integer', `cl:char-code-limit' `cl:char-code',
`cl:code-char', `cl:char-name', `cl:name-char', `cl:char-upcase', `cl:char-downcase',
`cl:char-int', `cl:schar', `cl:digit-char', `cl:character', `cl:base-char', `cl:standard-char',
`cl:extended-char',`cl:standard-char-p', `cl:graphic-char-p',
`cl:alpha-char-p',`cl:digit-char-p', `cl:alphanumericp', `cl:upper-case-p', `cl:lower-case-p',
`cl:both-case-p', `cl:char=', `cl:char/=', `cl:char<', `cl:char>', `cl:char<=', `cl:char>=',
`cl:char-equal', `char-not-equal'.~%▶▶▶")
(fundoc 'char-not-whitespace-char-p
"Whether MAYBE-NOT-WHITESPACE-CHAR is of type `mon:char-not-whitespace-char'.~%~@
:EXAMPLE~%
\(char-not-whitespace-char-p #\\a\)~%
\(char-not-whitespace-char-p #\\Tab\)
\(funcall \(complement #'char-not-whitespace-char-p\) #\\Tab\)
\(notany #'char-not-whitespace-char-p *whitespace-chars*\)
:SEE-ALSO `mon:whitespace-char', `mon:whitespace-char-p',
`mon:*whitespace-chars*'.~%▶▶▶")
(fundoc 'hexadecimal-char-p
"Whether MAYBE-HEX-CHAR is of type `mon:hexadecimal-char'~%~@
:EXAMPLE~%
\(hexadecimal-char-p #\\f\)~%
\(hexadecimal-char-p #\\F\)~%
\(hexadecimal-char-p #\\G\)~%
\(hexadecimal-char-p #\\0\)~%~@
:SEE-ALSO `mon:*hexadecimal-chars*', `mon:whitespace-char-p', `cl:base-char-p',
`cl:char-code-integer', `cl:char-code-limit' `cl:char-code', `cl:code-char',
`cl:char-name', `cl:name-char', `cl:char-upcase', `cl:char-downcase',
`cl:char-int', `cl:schar', `cl:digit-char', `cl:character', `cl:base-char',
`cl:standard-char', `cl:extended-char',`cl:standard-char-p',
`cl:graphic-char-p', `cl:alpha-char-p',`cl:digit-char-p', `cl:alphanumericp',
`cl:upper-case-p', `cl:lower-case-p', `cl:both-case-p', `cl:char=', `cl:char/=',
`cl:char<', `cl:char>', `cl:char<=', `cl:char>=', `cl:char-equal',
`char-not-equal'.~%▶▶▶")
;; When optional arg stream is provided it should satisfy `streamp' and `open-stream-p'.
;; Signal an error if not.~%~@
(fundoc 'chars-not-in-string-p
"Return T when none of the characters in CHAR-BAG are in STRING.~%~@
If a character in CHAR-BAG is in STRING return as if by vaules with first value
null and second the position of the character in STRING.~%~@
CHAR-BAG is a proper-list with each element satisfying `cl:characterp'.
STRING is a string.~%~@
Keyword :TEST is a function accepting one arg which returns non-nil when a
character in CHAR-BAG is present in STRING. Default is `cl:char='.~%~@
:EXAMPLE~%
\(chars-not-in-string-p '\(#\\Q #\\E #\\D\) \"#package.\"\)~%
\(chars-not-in-string-p '\(#\\Q #\\E #\\D\) \"#package.\" :test #'char-equal\)~%
\(chars-not-in-string-p '\(#\\# #\\E #\\.\) \"#package.\"\)~%~@
:SEE-ALSO `<XREF>'.~%▶▶▶")
(fundoc 'char-to-string
"Convert CHAR to a string containing that character.~%~@
CHAR may be of type `cl:character'.
When ALLOW-INTEGERS is non-nil CHAR may also be of type `mon:char-code-integer'.~%~@
Keyword STREAM is provided return output to STREAM.
It should satisfy `streamp' and `open-stream-p' Signal an error if not.~%~@
Keyword ALLOW-INTEGERS is a boolean it defaults to T.
When ALLOW-INTEGERS is true, if CHAR satisfies mon:char-code-integer-p it will
be converted to a string as if by `mon:char-code-integer-to-string', if not a
`cl:type-error' condition is signaled.~%~@
:EXAMPLE~%
\(char-to-string #\\a\)~%
\(char-to-string 97 :allow-integers t\)~%
\(with-open-stream \(s \(make-string-output-stream\)\)
\(char-to-string 97 :stream s :allow-integers t\)
\(char-to-string #\\\\b :stream s\)
\(char-to-string 99 :stream s :allow-integers t\)
\(get-output-stream-string s\)\)~%~@
:EMACS-LISP-COMPAT~%~@
:SEE-ALSO `char-list-to-string', `string-to-char', `string-to-number',
`char-code-limit' `char-code', `code-char', `char-name', `name-char',
`char-upcase', `char-downcase', `char-int', `schar', `digit-char', `character',
`base-char', `standard-char', `extended-char',`standard-char-p',
`graphic-char-p', `alpha-char-p',`digit-char-p', `alphanumericp',
`upper-case-p', `lower-case-p', `both-case-p', `char=', `char/=', `char<',
`char>', `char<=', `char>=', `char-equal', `char-not-equal+'.~%▶▶▶")
(fundoc 'char-code-integer-to-string
"Convert CHAR-CODE-INT to string.~%~@
CHAR-CODE-INT should satisfy `mon:char-code-integer-p'.
Signal an error if not.~%~@
When optional arg stream is provided it should satisfy `streamp' and `open-stream-p'.
Signal an error if not.~%~@
:EXAMPLE~%
\(char-code-integer-to-string 9658\)~%
;; Following signals an error:~%
\(char-code-integer-to-string -1\)~%~@
:SEE-ALSO `mon:char-code-integer-p', `mon:char-code-integer-to-string',
`mon:char-to-string', `char-list-to-string', `mon:char-code-integer',
`mon:char-or-char-code-integer-or-string-1-ensure-char'.~%▶▶▶")
(fundoc 'char-code-integer-to-char
"Convert CHAR-CODE-INTEGER-TO-CHAR to an object of type `cl:character'.~%~@
When argument is `cl:characterp' return it.
When argument is `mon:char-code-integer-p' return its `code-char' value.
If neither of the above constraints is satsified signal an error.~%~@
When keyword W-NO-ERROR is non-nil do not signal an error, instead return
argument CHAR-CODE-INTEGER-TO-CHAR.
:EXAMPLE~%
\(char-code-integer-to-char 9658\)~%
\(char-code-integer-to-char #\\►\)~%
\(char-code-integer-to-char nil\)~%
\(char-code-integer-to-char \"string\"\)~%
\(char-code-integer-to-char \"string\" :w-no-error t\)~%~@
:SEE-ALSO `mon:char-code-integer-p', `mon:char-code-integer-to-string',
`mon:char-to-string', `char-list-to-string', `mon:char-code-integer',
`mon:char-or-char-code-integer-or-string-1-ensure-char'.~%▶▶▶")
(fundoc 'char-or-char-code-integer-or-string-1-ensure-char
"If CHAR-OR-CHAR-CODE-INTEGER-OR-STRING-1 may be coerced to a character do so.~%~@
Signal an error if char-or-char-code-integer-or-string-1 is not of type:
`cl:character', `mon:char-code-integer', `mon:simple-string-of-length-1', `mon:string-of-length-1'
:EXAMPLE~%
\(char-or-char-code-integer-or-string-1-ensure-char #\\a\)~%
\(char-or-char-code-integer-or-string-1-ensure-char 0\)~%
\(char-or-char-code-integer-or-string-1-ensure-char \(format nil \"~~C\" #\\TAB\)\)~%
\(char-or-char-code-integer-or-string-1-ensure-char
\(make-array 1 :element-type 'character :initial-element #\\nul :adjustable t :fill-pointer 0\)\)~%~@
;; Following fail successfully:~%
\(char-or-char-code-integer-or-string-1-ensure-char \(1+ char-code-limit\)\)~%
\(char-or-char-code-integer-or-string-1-ensure-char \"ab\"\)~%
\(char-or-char-code-integer-or-string-1-ensure-char \"\"\)~%
\(char-or-char-code-integer-or-string-1-ensure-char
\(make-array 2 :element-type 'character :initial-element #\\nul :adjustable t :fill-pointer 0\)\)~%~@
:SEE-ALSO `mon:char-code-integer-p', `mon:char-code-integer-to-string',
`mon:char-to-string', `char-list-to-string', `mon:char-code-integer'.~%▶▶▶")
(fundoc 'char-ascii-table
"Return a list of conses mapping integers to an ASCII string equivalent.~%~@
Keyword CASE is one of { :lower | :upper | :lower-upper | :upper-lower }.~%~@
When CASE is :LOWER map [a,z] to integers [1,26].~%
When CASE is :UPPER map integers map [A,Z] to integers [1,26]~%
When CASE is :LOWER-UPPER map [a,z] to integers [1,26]
map [A,Z] to integers [27,52]~%~@
When CASE is :LOWER-UPPER map [A,Z] to integers [1,26]
map [a,z] to integers [27,52]~%~@
:EXAMPLE~%
\(char-ascii-table :case :lower\)~%
\(char-ascii-table :case :upper\)~%
\(char-ascii-table :case :upper-lower\)~%
\(char-ascii-table :case :lower-upper\)~%~@
:SEE-ALSO `<XREF>'.~%▶▶▶")
(fundoc 'char-list-to-string
"Convert charcters of CHAR-LIST to string.~%~@
CHAR-LIST should satisfy `mon:each-a-character-p'. Signal an error if not.~%~@
Optional arg STREAM is a destination stream default string to.~%~@
:EXAMPLE~%
\(char-list-to-string '\(#\\a #\\b 99\)~%
\(char-list-to-string '\(#\\a #\\b #\\c\)\)~%
;; (char-list-to-string (list #\a 98 #\c 9658))
;; (char-list-to-string (list #\a #\b #\c))
;; (char-list-to-string (list 97 97 99 9658))
(with-open-stream (s (make-string-output-stream))
(char-list-to-string '(#\a 98 #\c 9658) s)
(char-list-to-string '(#\a #\b #\c) s)
(char-list-to-string '(97 98 99 9658) s)
(get-output-stream-string s))
:SEE-ALSO `<XREF>'.~%▶▶▶")
(fundoc 'max-char
"The upper exclusive bound on values produced by CHAR-CODE~%~@
:EXAMPLE~%
\(max-char\)~%~@
:EMACS-LISP-COMPAT~%~@
:SEE-ALSO `char-code-limit' `char-code', `code-char', `char-name', `name-char',
`char-upcase', `char-downcase', `char-int', `schar', `digit-char', `character',
`standard-char-p', `graphic-char-p', `alpha-char-p',`digit-char-p',
`alphanumericp', `upper-case-p', `lower-case-p', `both-case-p', `char=',
`char/=', `char<', `char>', `char<=', `char>=', `char-equal',
`char-not-equal+'.~%▶▶▶")
(fundoc 'char-for-readtable-case
"Return CASE-FROB-CHAR according to the `cl:readtable-case' of READTABLE~%~@
When optional arg READTABLE is provided it should satisfy `cl:readtable', signal
an error if not. When ommitted default to value of `cl:*readtable*'.~%~@
:EXAMPLE~%
\(readtable-case *readtable*\)~%
\(char-for-readtable-case #\\a\)~%
\(char-for-readtable-case #\\A\)~%
\(char-for-readtable-case #\\SPACE\)~%~@
:SEE-ALSO `char-invert-case-maybe', `mon:string-invert-case',
`mon:string-for-readtable-case', `mon:read-symbol-name-preserving-case',
`mon:read-symbol-name-preserving-case-if', `cl:char-downcase', `cl:char-upcase',
`cl:upper-case-p', `cl:lower-case-p''.~%▶▶▶")
(fundoc 'char-invert-case-maybe
"Convert CHAR-TO-INVERT accoring to MODE of `cl:readtable-case' for `cl:*readtable*'.~%~@
Keyword CASE is a case sensitivity mode, when non-nil it should be valid value per:~%
\(setf \(readtable-case <READTABLE\) MODE\)~%~@
Possible arguments for CASE are:~%
:preserve :upcase :downcase :invert~%~@
Default is :preserve. If CASE is not a member of the above enumeration it
defaults to :preserve.~%~@
:EXAMPLE~%
\(char-to-invert #\\A\)~%
\(char-to-invert #\\A :case :downcase\)~%
\(char-to-invert #\\A :case :upcase\)~%
\(char-to-invert #\\a :case :upcase\)~%~@
:SEE-ALSO `char-for-readtable-case', `mon:string-invert-case',
`mon:string-for-readtable-case', `mon:read-symbol-name-preserving-case',
`mon:read-symbol-name-preserving-case-if', `cl:char-downcase', `cl:char-upcase',
`cl:upper-case-p', `cl:lower-case-p''.~%▶▶▶")
#+sbcl
(setf (documentation 'char-length 'function)
#.(format nil
"Return the number of bytes required to represent MB-CHAR.~%~@
:EXAMPLE~%
\(char-length #\\►\)~%
\(char-length #\\a\)~%
\(char-length #\\FF\)~%~@
:NOTE UTF-8 centric.~%~@
:SEE-ALSO `char-code-limit' `char-code', `code-char', `char-name', `name-char',
`char-upcase', `char-downcase', `char-int', `schar', `digit-char', `character',
`base-char', `standard-char', `extended-char', `standard-char-p',
`graphic-char-p', `alpha-char-p',`digit-char-p', `alphanumericp',
`upper-case-p', `lower-case-p', `both-case-p', `char=', `char/=', `char<',
`char>', `char<=', `char>=', `char-equal', `char-not-equal+'.~%▶▶▶"))
(fundoc 'char-escape-as-unicode-octochar-string
"Convert CHAR-TO-ESCAPE to a string in Unicode octal rerpesentation.~%~@
:EXAMPLE~%
\(char-escape-as-unicode-octochar-string #\\▶\)
=> \"\\\\U000025B6\" ~%~@
:SEE-ALSO `mon:string-escape-as-unicode-octo-chars'.~%▶▶▶")
(fundoc 'string-escape-as-unicode-octo-chars
"Convert STRING-TO-ESCAPE to a string in Unicode octal rerpesentation.~%~@
:EXAMPLE~%~@
\(string-escape-as-unicode-octo-chars \"∀∃≣∧∨¬\"\)
=> \"\\\\U00002200\\\\U00002203\\\\U00002263\\\\U00002227\\\\U00002228\\\\U000000AC\"~%
\(string-escape-as-unicode-octo-chars \"\"\)
=> \"\"~%~@
:SEE-ALSO `mon:char-escape-as-unicode-octochar-string'.~%▶▶▶")
;;; ==============================
;; Local Variables:
;; indent-tabs-mode: nil
;; show-trailing-whitespace: t
;; mode: lisp-interaction
;; package: mon
;; End:
;;; ==============================
;;; EOF