~ chicken-core (master) /tests/unicode-tests.scm
Trap1;;; unicode tests, taken from Chibi23(import (chicken port) (chicken sort))4(import (chicken string) (chicken io))5(import (chicken bytevector))6(import (only (scheme base) write-string))78(include "test.scm")910(test-begin "scheme")1112(test-equal #\Р (string-ref "Русский" 0))13(test-equal #\и (string-ref "Русский" 5))14(test-equal #\й (string-ref "Русский" 6))1516(test-equal 7 (string-length "Русский"))1718(test-equal #\日 (string-ref "日本語" 0))19(test-equal #\本 (string-ref "日本語" 1))20(test-equal #\語 (string-ref "日本語" 2))2122(test-equal 3 (string-length "日本語"))2324(test-equal '(#\日 #\本 #\語) (string->list "日本語"))25(test-equal "日本語" (list->string '(#\日 #\本 #\語)))2627(test-equal "日本" (substring "日本語" 0 2))28(test-equal "本語" (substring "日本語" 1 3))2930(test-equal "日-語"31 (let ((s (substring "日本語" 0 3)))32 (string-set! s 1 #\-)33 s))3435(test-equal "日本人"36 (let ((s (substring "日本語" 0 3)))37 (string-set! s 2 #\人)38 s))3940(test-equal "字字字" (make-string 3 #\字))4142(test-equal "字字字"43 (let ((s (make-string 3)))44 (string-fill! s #\字)45 s))4647; tests from the utf8 egg:4849(test-equal 2 (string-length "漢字"))5051(test-equal 28450 (char->integer (string-ref "漢字" 0)))5253(define str (string-copy "漢字"))5455(test-equal "赤字" (begin (string-set! str 0 (string-ref "赤" 0)) str))5657(test-equal "赤外" (begin (string-set! str 1 (string-ref "外" 0)) str))5859(test-equal "赤x" (begin (string-set! str 1 #\x) str))6061(test-equal "赤々" (begin (string-set! str 1 (string-ref "々" 0)) str))6263(test-equal "文字列" (substring "文字列" 0))64(test-equal "字列" (substring "文字列" 1))65(test-equal "列" (substring "文字列" 2))66(test-equal "文" (substring "文字列" 0 1))67(test-equal "字" (substring "文字列" 1 2))68(test-equal "文字" (substring "文字列" 0 2))6970(define *string* "文字列")71(define *list* '("文" "字" "列"))72(define *chars* '(25991 23383 21015))7374(test-equal *chars* (map char->integer (string->list "文字列")))7576(test-equal *list* (map string (map integer->char *chars*)))7778(test-equal *string* (list->string (map integer->char '(25991 23383 21015))))7980(test-equal "列列列" (make-string 3 (string-ref "列" 0)))8182(test-equal "文文文" (let ((s (string-copy "abc"))) (string-fill! s (string-ref "文" 0)) s))8384(test-equal (string-ref "ハ" 0) (with-input-from-string "全角ハンカク"85 (lambda () (read-char) (read-char) (read-char))))8687(test-equal "個々" (with-output-to-string88 (lambda ()89 (write-char (string-ref "個" 0))90 (write-char (string-ref "々" 0)))))9192;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;93;; library9495(test-equal "出力改行\n" (with-output-to-string96 (lambda () (print "出" (string-ref "力" 0) "改行"))))9798(test-equal "出力" (with-output-to-string99 (lambda () (print* "出" (string-ref "力" 0) ""))))100101(test-equal "逆リスト→文字列" (reverse-list->string102 (map (cut string-ref <> 0)103 '("列" "字" "文" "→" "ト" "ス" "リ" "逆"))))104105(test-error (utf8->string #u8(255 1 2)))106(test-assert (utf8->string #u8(255 1 2) #f))107(test-equal (string-length (utf8->string #u8(255 1 2) #f)) 3)108109;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;110;; extras111112(test-equal "这是" (with-input-from-string "这是中文" (cut read-string 2)))113114(define s "abcdef")115(call-with-input-string "这是中文" (cut read-string! 2 s <> 2))116(test-equal "ab这是ef" s)117118(define s "这是中文")119(call-with-input-string "abcd" (cut read-string! 1 s <> 2))120(test-equal "这是a文" s)121122(test-equal "这是" (with-output-to-string (cut write-string "这是中文" (current-output-port) 0 2)))123124(test-equal "我爱她" (conc (with-input-from-string "我爱你"125 (cut read-token (lambda (c)126 (memv c (map (cut string-ref <> 0)127 '("爱" "您" "我"))))))128 "她"))129130(test-equal '("第一" "第二" "第三") (string-chop "第一第二第三" 2))131132(test-equal '("第一" "第二" "第三" "…") (string-chop "第一第二第三…" 2))133134(test-equal '("a" "bc" "第" "f几") (string-split "a,bc、第,f几" ",、"))135136(test-equal "THE QUICK BROWN FOX JUMPED OVER THE LAZY SLEEPING DOG"137 (string-translate "the quick brown fox jumped over the lazy sleeping dog"138 "abcdefghijklmnopqrstuvwxyz"139 "ABCDEFGHIJKLMNOPQRSTUVWXYZ"))140(test-equal ":foo:bar:baz" (string-translate "/foo/bar/baz" "/" ":"))141(test-equal "你爱我" (string-translate "我爱你" "我你" "你我"))142(test-equal "你爱我" (string-translate "我爱你" '(#\我 #\你) '(#\你 #\我)))143(test-equal "我你" (string-translate "我爱你" "爱"))144(test-equal "我你" (string-translate "我爱你" #\爱))145146(test-assert (substring=? "日本語" "日本語"))147(test-assert (substring=? "日本語" "日本"))148(test-assert (substring=? "日本" "日本語"))149(test-assert (substring=? "日本語" "本語" 1))150(test-assert (substring=? "日本語" "本" 1 0 1))151(test-assert (substring=? "听说上海的东西很贵" "上海的东西很便宜" 2 0 5))152153(test-equal 2 (substring-index "上海" "听说上海的东西很贵"))154155;; case folding156157(test-assert (string-ci=? "abc" "ABC"))158(test-assert (string-ci=? "Xῌηιx" "xηιῌX"))159(test-assert (string-ci=? "αβξ" "αβξ"))160(test-assert (string-ci=? "αβξ" "ΑΒΞ"))161162(test-end)163164(test-exit)165