fix incorrect folder name for julia-0.6.x

Former-commit-id: ef2c7401e0876f22d2f7762d182cfbcd5a7d9c70
2018-06-11 03:28:36 -07:00
parent 5e0e436e4e
commit 0e4acfb8f2
722 changed files with 0 additions and 0 deletions
@@ -0,0 +1,484 @@
+# This file is a part of Julia. License is MIT: https://julialang.org/license
+
+# constructors
+@test String([0x61,0x62,0x63,0x21]) == "abc!"
+@test String("abc!") == "abc!"
+
+@test isempty(string())
+@test eltype(GenericString) == Char
+@test start("abc") == 1
+@test cmp("ab","abc") == -1
+
+# {starts,ends}with
+@test startswith("abcd", 'a')
+@test startswith("abcd", "a")
+@test startswith("abcd", "ab")
+@test !startswith("ab", "abcd")
+@test !startswith("abcd", "bc")
+@test endswith("abcd", 'd')
+@test endswith("abcd", "d")
+@test endswith("abcd", "cd")
+@test !endswith("abcd", "dc")
+@test !endswith("cd", "abcd")
+@test startswith("ab\0cd", "ab\0c")
+@test !startswith("ab\0cd", "ab\0d")
+
+@test filter(x -> x ∈ ['f', 'o'], "foobar") == "foo"
+
+# string iteration, and issue #1454
+str = "é"
+str_a = vcat(str...)
+@test length(str_a)==1
+@test str_a[1] == str[1]
+
+str = "s\u2200"
+@test str[1:end] == str
+
+# sizeof
+@test sizeof("abc") == 3
+@test sizeof("\u2222") == 3
+
+# issue #3597
+@test string(GenericString("Test")[1:1], "X") == "TX"
+
+for T = (UInt8,Int8,UInt16,Int16,UInt32,Int32,UInt64,Int64,UInt128,Int128,BigInt),
+    b = 2:62, _ = 1:10
+    n = T != BigInt ? rand(T) : BigInt(rand(Int128))
+    @test parse(T,base(b,n),b) == n
+end
+
+# issue #6027
+let
+    # make symbol with invalid char
+    sym = Symbol(Char(0xdcdb))
+    @test string(sym) == string(Char(0xdcdb))
+    @test String(sym) == string(Char(0xdcdb))
+    @test expand(sym) === sym
+    res = string(parse(string(Char(0xdcdb)," = 1"),1,raise=false)[1])
+    @test res == """\$(Expr(:error, "invalid character \\\"\\udcdb\\\"\"))"""
+end
+
+@test Symbol("asdf") === :asdf
+@test Symbol(:abc,"def",'g',"hi",0) === :abcdefghi0
+@test :a < :b
+@test startswith(string(gensym("asdf")),"##asdf#")
+@test gensym("asdf") != gensym("asdf")
+@test gensym() != gensym()
+@test startswith(string(gensym()),"##")
+@test_throws ArgumentError Symbol("ab\0")
+@test_throws ArgumentError gensym("ab\0")
+
+# issue #6949
+let f =IOBuffer(),
+    x = split("1 2 3")
+    @test write(f, x) == 3
+    @test String(take!(f)) == "123"
+    @test invoke(write, Tuple{IO, AbstractArray}, f, x) == 3
+    @test String(take!(f)) == "123"
+end
+
+# issue #7248
+@test_throws BoundsError ind2chr("hello", -1)
+@test_throws BoundsError chr2ind("hello", -1)
+@test_throws BoundsError ind2chr("hellø", -1)
+@test_throws BoundsError chr2ind("hellø", -1)
+@test_throws BoundsError ind2chr("hello", 10)
+@test_throws BoundsError chr2ind("hello", 10)
+@test_throws BoundsError ind2chr("hellø", 10)
+@test_throws BoundsError chr2ind("hellø", 10)
+@test_throws BoundsError checkbounds("hello", 0)
+@test_throws BoundsError checkbounds("hello", 6)
+@test_throws BoundsError checkbounds("hello", 0:3)
+@test_throws BoundsError checkbounds("hello", 4:6)
+@test_throws BoundsError checkbounds("hello", [0:3;])
+@test_throws BoundsError checkbounds("hello", [4:6;])
+@test checkbounds("hello", 2)
+@test checkbounds("hello", 1:5)
+@test checkbounds("hello", [1:5;])
+
+# issue #15624 (indexing with out of bounds empty range)
+@test ""[10:9] == ""
+@test "hello"[10:9] == ""
+@test "hellø"[10:9] == ""
+@test SubString("hello", 1, 6)[10:9] == ""
+@test SubString("hello", 1, 0)[10:9] == ""
+@test SubString("hellø", 1, 6)[10:9] == ""
+@test SubString("hellø", 1, 0)[10:9] == ""
+@test SubString("", 1, 6)[10:9] == ""
+@test SubString("", 1, 0)[10:9] == ""
+
+
+#=
+# issue #7764
+let
+    srep = repeat("Σβ",2)
+    s="Σβ"
+    ss=SubString(s,1,endof(s))
+
+    @test repeat(ss,2) == "ΣβΣβ"
+
+    @test endof(srep) == 7
+
+    @test next(srep, 3) == ('β',5)
+    @test next(srep, 7) == ('β',9)
+
+    @test srep[7] == 'β'
+    @test_throws BoundsError srep[8]
+end
+=#
+
+# This caused JuliaLang/JSON.jl#82
+@test first('\x00':'\x7f') === '\x00'
+@test last('\x00':'\x7f') === '\x7f'
+
+# make sure substrings handle last code unit even if not start of codepoint
+let s = "x\u0302"
+    @test s[1:3] == s
+end
+
+# issue #9781
+# float(SubString) wasn't tolerant of trailing whitespace, which was different
+# to "normal" strings. This also checks we aren't being too tolerant and allowing
+# any arbitrary trailing characters.
+@test parse(Float64,"1\n") == 1.0
+@test [parse(Float64,x) for x in split("0,1\n",",")][2] == 1.0
+@test_throws ArgumentError parse(Float64,split("0,1 X\n",",")[2])
+@test parse(Float32,"1\n") == 1.0
+@test [parse(Float32,x) for x in split("0,1\n",",")][2] == 1.0
+@test_throws ArgumentError parse(Float32,split("0,1 X\n",",")[2])
+
+@test ucfirst("Hola")=="Hola"
+@test ucfirst("hola")=="Hola"
+@test ucfirst("")==""
+@test ucfirst("*")=="*"
+
+@test lcfirst("Hola")=="hola"
+@test lcfirst("hola")=="hola"
+@test lcfirst("")==""
+@test lcfirst("*")=="*"
+
+# test AbstractString functions at beginning of string.jl
+struct tstStringType <: AbstractString
+    data::Array{UInt8,1}
+end
+tstr = tstStringType("12")
+@test_throws ErrorException endof(tstr)
+@test_throws ErrorException next(tstr, Bool(1))
+
+gstr = GenericString("12")
+@test typeof(string(gstr))==GenericString
+
+@test convert(Array{UInt8}, gstr) ==[49;50]
+@test convert(Array{Char,1}, gstr) ==['1';'2']
+@test convert(Symbol, gstr)==Symbol("12")
+
+@test gstr[1] == '1'
+@test gstr[1:1] == "1"
+@test gstr[[1]] == "1"
+
+@test done(eachindex("foobar"),7)
+@test eltype(Base.EachStringIndex) == Int
+@test map(uppercase, "foó") == "FOÓ"
+@test chr2ind("fóobar",3) == 4
+
+@test Symbol(gstr)==Symbol("12")
+
+@test_throws ErrorException sizeof(gstr)
+
+@test length(GenericString(""))==0
+
+@test nextind(1:1, 1) == 2
+@test nextind([1], 1) == 2
+
+@test ind2chr(gstr,2)==2
+
+# issue #10307
+@test typeof(map(Int16,AbstractString[])) == Vector{Int16}
+
+for T in [Int8, UInt8, Int16, UInt16, Int32, UInt32, Int64, UInt64, Int128, UInt128]
+    for i in [typemax(T), typemin(T)]
+        s = "$i"
+        @test get(tryparse(T, s)) == i
+    end
+end
+
+for T in [Int8, Int16, Int32, Int64, Int128]
+    for i in [typemax(T), typemin(T)]
+        f = "$(i)0"
+        @test isnull(tryparse(T, f))
+    end
+end
+
+# issue #11142
+s = "abcdefghij"
+sp = pointer(s)
+@test unsafe_string(sp) == s
+@test unsafe_string(sp,5) == "abcde"
+@test typeof(unsafe_string(sp)) == String
+s = "abcde\uff\u2000\U1f596"
+sp = pointer(s)
+@test unsafe_string(sp) == s
+@test unsafe_string(sp,5) == "abcde"
+@test typeof(unsafe_string(sp)) == String
+
+@test get(tryparse(BigInt, "1234567890")) == BigInt(1234567890)
+@test isnull(tryparse(BigInt, "1234567890-"))
+
+@test get(tryparse(Float64, "64")) == 64.0
+@test isnull(tryparse(Float64, "64o"))
+@test get(tryparse(Float32, "32")) == 32.0f0
+@test isnull(tryparse(Float32, "32o"))
+
+# issue #10994: handle embedded NUL chars for string parsing
+for T in [BigInt, Int8, UInt8, Int16, UInt16, Int32, UInt32, Int64, UInt64, Int128, UInt128]
+    @test_throws ArgumentError parse(T, "1\0")
+end
+for T in [BigInt, Int8, UInt8, Int16, UInt16, Int32, UInt32, Int64, UInt64, Int128, UInt128, Float64, Float32]
+    @test isnull(tryparse(T, "1\0"))
+end
+let s = normalize_string("tést",:NFKC)
+    @test unsafe_string(Base.unsafe_convert(Cstring, Base.cconvert(Cstring, s))) == s
+    @test unsafe_string(convert(Cstring, Symbol(s))) == s
+end
+@test_throws ArgumentError Base.unsafe_convert(Cstring, Base.cconvert(Cstring, "ba\0d"))
+
+cstrdup(s) = @static is_windows() ? ccall(:_strdup, Cstring, (Cstring,), s) : ccall(:strdup, Cstring, (Cstring,), s)
+let p = cstrdup("hello")
+    @test unsafe_string(p) == "hello"
+    Libc.free(p)
+end
+
+# iteration
+@test [c for c in "ḟøøƀäṙ"] == ['ḟ', 'ø', 'ø', 'ƀ', 'ä', 'ṙ']
+@test [i for i in eachindex("ḟøøƀäṙ")] == [1, 4, 6, 8, 10, 12]
+@test [x for x in enumerate("ḟøøƀäṙ")] == [(1, 'ḟ'), (2, 'ø'), (3, 'ø'), (4, 'ƀ'), (5, 'ä'), (6, 'ṙ')]
+
+# test all edge conditions
+for (val, pass) in (
+        (0, true), (0xd7ff, true),
+        (0xd800, false), (0xdfff, false),
+        (0xe000, true), (0xffff, true),
+        (0x10000, true), (0x10ffff, true),
+        (0x110000, false)
+    )
+    @test isvalid(Char, val) == pass
+end
+for (val, pass) in (
+        (b"\x00", true),
+        (b"\x7f", true),
+        (b"\x80", false),
+        (b"\xbf", false),
+        (b"\xc0", false),
+        (b"\xff", false),
+        (b"\xc0\x80", false),
+        (b"\xc1\x80", false),
+        (b"\xc2\x80", true),
+        (b"\xc2\xc0", false),
+        (b"\xed\x9f\xbf", true),
+        (b"\xed\xa0\x80", false),
+        (b"\xed\xbf\xbf", false),
+        (b"\xee\x80\x80", true),
+        (b"\xef\xbf\xbf", true),
+        (b"\xf0\x90\x80\x80", true),
+        (b"\xf4\x8f\xbf\xbf", true),
+        (b"\xf4\x90\x80\x80", false),
+        (b"\xf5\x80\x80\x80", false),
+        (b"\ud800\udc00", false),
+        (b"\udbff\udfff", false),
+        (b"\ud800\u0100", false),
+        (b"\udc00\u0100", false),
+        (b"\udc00\ud800", false)
+        )
+    @test isvalid(String, val) == pass == isvalid(String(val))
+end
+
+# Issue #11203
+@test isvalid(String, UInt8[]) == true == isvalid("")
+
+# Check UTF-8 characters
+# Check ASCII range (true),
+# then single continuation bytes and lead bytes with no following continuation bytes (false)
+for (rng,flg) in ((0:0x7f, true), (0x80:0xff, false))
+    for byt in rng
+        @test isvalid(String, UInt8[byt]) == flg
+    end
+end
+# Check overlong lead bytes for 2-character sequences (false)
+for byt = 0xc0:0xc1
+    @test isvalid(String, UInt8[byt,0x80]) == false
+end
+# Check valid lead-in to two-byte sequences (true)
+for byt = 0xc2:0xdf
+    for (rng,flg) in ((0x00:0x7f, false), (0x80:0xbf, true), (0xc0:0xff, false))
+        for cont in rng
+            @test isvalid(String, UInt8[byt, cont]) == flg
+        end
+    end
+end
+# Check three-byte sequences
+for r1 in (0xe0:0xec, 0xee:0xef)
+    for byt = r1
+        # Check for short sequence
+        @test isvalid(String, UInt8[byt]) == false
+        for (rng,flg) in ((0x00:0x7f, false), (0x80:0xbf, true), (0xc0:0xff, false))
+            for cont in rng
+                @test isvalid(String, UInt8[byt, cont]) == false
+                @test isvalid(String, UInt8[byt, cont, 0x80]) == flg
+            end
+        end
+    end
+end
+# Check hangul characters (0xd000-0xd7ff) hangul
+# Check for short sequence, or start of surrogate pair
+for (rng,flg) in ((0x00:0x7f, false), (0x80:0x9f, true), (0xa0:0xff, false))
+    for cont in rng
+        @test isvalid(String, UInt8[0xed, cont]) == false
+        @test isvalid(String, UInt8[0xed, cont, 0x80]) == flg
+    end
+end
+# Check valid four-byte sequences
+for byt = 0xf0:0xf4
+    if (byt == 0xf0)
+        r0 = ((0x00:0x8f, false), (0x90:0xbf, true), (0xc0:0xff, false))
+    elseif byt == 0xf4
+        r0 = ((0x00:0x7f, false), (0x80:0x8f, true), (0x90:0xff, false))
+    else
+        r0 = ((0x00:0x7f, false), (0x80:0xbf, true), (0xc0:0xff, false))
+    end
+    for (rng,flg) in r0
+        for cont in rng
+            @test isvalid(String, UInt8[byt, cont]) == false
+            @test isvalid(String, UInt8[byt, cont, 0x80]) == false
+            @test isvalid(String, UInt8[byt, cont, 0x80, 0x80]) == flg
+        end
+    end
+end
+# Check five-byte sequences, should be invalid
+for byt = 0xf8:0xfb
+    @test isvalid(String, UInt8[byt, 0x80, 0x80, 0x80, 0x80]) == false
+end
+# Check six-byte sequences, should be invalid
+for byt = 0xfc:0xfd
+    @test isvalid(String, UInt8[byt, 0x80, 0x80, 0x80, 0x80, 0x80]) == false
+end
+# Check seven-byte sequences, should be invalid
+@test isvalid(String, UInt8[0xfe, 0x80, 0x80, 0x80, 0x80, 0x80]) == false
+
+# 11482
+
+# lower and upper
+@test uppercase("aBc") == "ABC"
+@test uppercase('A') == 'A'
+@test uppercase('a') == 'A'
+@test lowercase("AbC") == "abc"
+@test lowercase('A') == 'a'
+@test lowercase('a') == 'a'
+@test uppercase('α') == '\u0391'
+@test lowercase('Δ') == 'δ'
+@test lowercase('\U118bf') == '\U118df'
+@test uppercase('\U1044d') == '\U10425'
+@test ucfirst("Abc") == "Abc"
+@test ucfirst("abc") == "Abc"
+@test lcfirst("ABC") == "aBC"
+@test lcfirst("aBC") == "aBC"
+@test ucfirst(GenericString("")) == ""
+@test lcfirst(GenericString("")) == ""
+@test ucfirst(GenericString("a")) == "A"
+@test lcfirst(GenericString("A")) == "a"
+@test lcfirst(GenericString("a")) == "a"
+@test ucfirst(GenericString("A")) == "A"
+
+# titlecase
+@test titlecase('ǉ') == 'ǈ'
+@test titlecase("ǉubljana") == "ǈubljana"
+@test titlecase("aBc ABC") == "ABc ABC"
+@test titlecase("abcD   EFG\n\thij") == "AbcD   EFG\n\tHij"
+
+# issue # 11464: uppercase/lowercase of GenericString becomes a String
+str = "abcdef\uff\uffff\u10ffffABCDEF"
+@test typeof(uppercase("abcdef")) == String
+@test typeof(uppercase(GenericString(str))) == String
+@test typeof(lowercase("ABCDEF")) == String
+@test typeof(lowercase(GenericString(str))) == String
+
+foomap(ch) = (ch > Char(65))
+foobar(ch) = Char(0xd800)
+foobaz(ch) = reinterpret(Char, typemax(UInt32))
+@test_throws ArgumentError map(foomap, GenericString(str))
+@test map(foobar, GenericString(str)) == String(repeat(b"\ud800", outer=[17]))
+@test map(foobaz, GenericString(str)) == String(repeat(b"\ufffd", outer=[17]))
+
+@test "a".*["b","c"] == ["ab","ac"]
+@test ["b","c"].*"a" == ["ba","ca"]
+@test ["a","b"].*["c" "d"] == ["ac" "ad"; "bc" "bd"]
+
+@test one(String) == ""
+@test prod(["*" for i in 1:3]) == "***"
+@test prod(["*" for i in 1:0]) == ""
+
+# Make sure NULL pointers are handled consistently by String
+@test_throws ArgumentError unsafe_string(Ptr{UInt8}(0))
+@test_throws ArgumentError unsafe_string(Ptr{UInt8}(0), 10)
+
+# ascii works on ASCII strings and fails on non-ASCII strings
+@test ascii("Hello, world") == "Hello, world"
+@test typeof(ascii("Hello, world")) == String
+@test ascii(GenericString("Hello, world")) == "Hello, world"
+@test typeof(ascii(GenericString("Hello, world"))) == String
+@test_throws ArgumentError ascii("Hello, ∀")
+@test_throws ArgumentError ascii(GenericString("Hello, ∀"))
+
+# issue #17271: endof() doesn't throw an error even with invalid strings
+@test endof(String(b"\x90")) == 0
+@test endof(String(b"\xce")) == 1
+
+# issue #17624, missing getindex method for String
+@test "abc"[:] == "abc"
+
+# issue #18280: next/nextind must return past String's underlying data
+for s in ("Hello", "Σ", "こんにちは", "😊😁")
+    @test next(s, endof(s))[2] > sizeof(s)
+    @test nextind(s, endof(s)) > sizeof(s)
+end
+
+# Test cmp with AbstractStrings that don't index the same as UTF-8, which would include
+# (LegacyString.)UTF16String and (LegacyString.)UTF32String, among others.
+
+mutable struct CharStr <: AbstractString
+    chars::Vector{Char}
+    CharStr(x) = new(collect(x))
+end
+Base.start(x::CharStr) = start(x.chars)
+Base.next(x::CharStr, i::Int) = next(x.chars, i)
+Base.done(x::CharStr, i::Int) = done(x.chars, i)
+Base.endof(x::CharStr) = endof(x.chars)
+
+# Simple case, with just ANSI Latin 1 characters
+@test "áB" != CharStr("áá") # returns false with bug
+@test cmp("áB", CharStr("áá")) == -1 # returns 0 with bug
+
+# Case with Unicode characters
+@test cmp("\U1f596\U1f596", CharStr("\U1f596")) == 1   # Gives BoundsError with bug
+@test cmp(CharStr("\U1f596"), "\U1f596\U1f596") == -1
+
+# repeat function
+@test repeat("xx",3) == repeat("x",6) == "xxxxxx"
+@test repeat("αα",3) == repeat("α",6) == "αααααα"
+
+# issue #12495: check that logical indexing attempt raises ArgumentError
+@test_throws ArgumentError "abc"[[true, false, true]]
+@test_throws ArgumentError "abc"[BitArray([true, false, true])]
+
+@testset "invalid code point" begin
+    s = String([0x61, 0xba, 0x41])
+    @test !isvalid(s)
+    @test_throws UnicodeError s[2]
+    e = try
+        s[2]
+    catch e
+        e
+    end
+    b = IOBuffer()
+    show(b, e)
+    @test String(take!(b)) == "UnicodeError: invalid character index 2 (0xba is a continuation byte)"
+end
@@ -0,0 +1,276 @@
+# This file is a part of Julia. License is MIT: https://julialang.org/license
+
+# string escaping & unescaping
+cx = Any[
+    0x00000000      '\0'        "\\0"
+    0x00000001      '\x01'      "\\x01"
+    0x00000006      '\x06'      "\\x06"
+    0x00000007      '\a'        "\\a"
+    0x00000008      '\b'        "\\b"
+    0x00000009      '\t'        "\\t"
+    0x0000000a      '\n'        "\\n"
+    0x0000000b      '\v'        "\\v"
+    0x0000000c      '\f'        "\\f"
+    0x0000000d      '\r'        "\\r"
+    0x0000000e      '\x0e'      "\\x0e"
+    0x0000001a      '\x1a'      "\\x1a"
+    0x0000001b      '\e'        "\\e"
+    0x0000001c      '\x1c'      "\\x1c"
+    0x0000001f      '\x1f'      "\\x1f"
+    0x00000020      ' '         " "
+    0x0000002f      '/'         "/"
+    0x00000030      '0'         "0"
+    0x00000039      '9'         "9"
+    0x0000003a      ':'         ":"
+    0x00000040      '@'         "@"
+    0x00000041      'A'         "A"
+    0x0000005a      'Z'         "Z"
+    0x0000005b      '['         "["
+    0x00000060      '`'         "`"
+    0x00000061      'a'         "a"
+    0x0000007a      'z'         "z"
+    0x0000007b      '{'         "{"
+    0x0000007e      '~'         "~"
+    0x0000007f      '\x7f'      "\\x7f"
+    0x000000bf      '\ubf'      "\\ubf"
+    0x000000ff      '\uff'      "\\uff"
+    0x00000100      '\u100'     "\\u100"
+    0x000001ff      '\u1ff'     "\\u1ff"
+    0x00000fff      '\ufff'     "\\ufff"
+    0x00001000      '\u1000'    "\\u1000"
+    0x00001fff      '\u1fff'    "\\u1fff"
+    0x0000ffff      '\uffff'    "\\uffff"
+    0x00010000      '\U10000'   "\\U10000"
+    0x0001ffff      '\U1ffff'   "\\U1ffff"
+    0x0002ffff      '\U2ffff'   "\\U2ffff"
+    0x00030000      '\U30000'   "\\U30000"
+    0x000dffff      '\Udffff'   "\\Udffff"
+    0x000e0000      '\Ue0000'   "\\Ue0000"
+    0x000effff      '\Ueffff'   "\\Ueffff"
+    0x000f0000      '\Uf0000'   "\\Uf0000"
+    0x000fffff      '\Ufffff'   "\\Ufffff"
+    0x00100000      '\U100000'  "\\U100000"
+    0x0010ffff      '\U10ffff'  "\\U10ffff"
+]
+
+for i = 1:size(cx,1)
+    cp, ch, st = cx[i,:]
+    @test cp == convert(UInt32, ch)
+    @test string(ch) == unescape_string(st)
+    if isascii(ch) || !isprint(ch)
+        @test st == escape_string(string(ch))
+    end
+    for j = 1:size(cx,1)
+        str = string(ch, cx[j,2])
+        @test str == unescape_string(escape_string(str))
+    end
+    @test repr(ch) == "'$(isprint(ch) ? ch : st)'"
+end
+
+for i = 0:0x7f, p = ["","\0","x","xxx","\x7f","\uFF","\uFFF",
+                     "\uFFFF","\U10000","\U10FFF","\U10FFFF"]
+    c = Char(i)
+    cp = string(c,p)
+    op = string(Char(div(i,8)), oct(i%8), p)
+    hp = string(Char(div(i,16)), hex(i%16), p)
+    @test string(unescape_string(string("\\",oct(i,1),p))) == cp
+    @test string(unescape_string(string("\\",oct(i,2),p))) == cp
+    @test string(unescape_string(string("\\",oct(i,3),p))) == cp
+    @test string(unescape_string(string("\\",oct(i,4),p))) == op
+    @test string(unescape_string(string("\\x",hex(i,1),p))) == cp
+    @test string(unescape_string(string("\\x",hex(i,2),p))) == cp
+    @test string(unescape_string(string("\\x",hex(i,3),p))) == hp
+end
+
+@test "\z" == unescape_string("\z") == "z"
+@test "\X" == unescape_string("\X") == "X"
+@test "\AbC" == unescape_string("\AbC") == "AbC"
+
+@test "\0" == unescape_string("\\0")
+@test "\1" == unescape_string("\\1")
+@test "\7" == unescape_string("\\7")
+@test "\0x" == unescape_string("\\0x")
+@test "\1x" == unescape_string("\\1x")
+@test "\7x" == unescape_string("\\7x")
+@test "\00" == unescape_string("\\00")
+@test "\01" == unescape_string("\\01")
+@test "\07" == unescape_string("\\07")
+@test "\70" == unescape_string("\\70")
+@test "\71" == unescape_string("\\71")
+@test "\77" == unescape_string("\\77")
+@test "\00x" == unescape_string("\\00x")
+@test "\01x" == unescape_string("\\01x")
+@test "\07x" == unescape_string("\\07x")
+@test "\70x" == unescape_string("\\70x")
+@test "\71x" == unescape_string("\\71x")
+@test "\77x" == unescape_string("\\77x")
+@test "\000" == unescape_string("\\000")
+@test "\001" == unescape_string("\\001")
+@test "\007" == unescape_string("\\007")
+@test "\070" == unescape_string("\\070")
+@test "\071" == unescape_string("\\071")
+@test "\077" == unescape_string("\\077")
+@test "\170" == unescape_string("\\170")
+@test "\171" == unescape_string("\\171")
+@test "\177" == unescape_string("\\177")
+@test "\0001" == unescape_string("\\0001")
+@test "\0011" == unescape_string("\\0011")
+@test "\0071" == unescape_string("\\0071")
+@test "\0701" == unescape_string("\\0701")
+@test "\0711" == unescape_string("\\0711")
+@test "\0771" == unescape_string("\\0771")
+@test "\1701" == unescape_string("\\1701")
+@test "\1711" == unescape_string("\\1711")
+@test "\1771" == unescape_string("\\1771")
+
+@test "\x0" == unescape_string("\\x0")
+@test "\x1" == unescape_string("\\x1")
+@test "\xf" == unescape_string("\\xf")
+@test "\xF" == unescape_string("\\xF")
+@test "\x0x" == unescape_string("\\x0x")
+@test "\x1x" == unescape_string("\\x1x")
+@test "\xfx" == unescape_string("\\xfx")
+@test "\xFx" == unescape_string("\\xFx")
+@test "\x00" == unescape_string("\\x00")
+@test "\x01" == unescape_string("\\x01")
+@test "\x0f" == unescape_string("\\x0f")
+@test "\x0F" == unescape_string("\\x0F")
+
+# Tests of join()
+@test join([]) == ""
+@test join(["a"],"?") == "a"
+@test join("HELLO",'-') == "H-E-L-L-O"
+@test join(1:5, ", ", " and ") == "1, 2, 3, 4 and 5"
+@test join(["apples", "bananas", "pineapples"], ", ", " and ") == "apples, bananas and pineapples"
+
+# issue #9178 `join` calls `done()` twice on the iterables
+mutable struct i9178
+    nnext::Int64
+    ndone::Int64
+end
+Base.start(jt::i9178) = (jt.nnext=0 ; jt.ndone=0 ; 0)
+Base.done(jt::i9178, n) = (jt.ndone += 1 ; n > 3)
+Base.next(jt::i9178, n) = (jt.nnext += 1 ; ("$(jt.nnext),$(jt.ndone)", n+1))
+@test join(i9178(0,0), ";") == "1,1;2,2;3,3;4,4"
+
+# quotes + interpolation (issue #455)
+@test "$("string")" == "string"
+arr = ["a","b","c"]
+@test "[$(join(arr, " - "))]" == "[a - b - c]"
+
+# join with empty input
+myio = IOBuffer()
+join(myio, "", "", 1)
+@test isempty(take!(myio))
+
+# unescape_chars
+@test Base.unescape_chars("\\t","t") == "t"
+@test_throws ArgumentError unescape_string(IOBuffer(), string('\\',"xZ"))
+@test_throws ArgumentError unescape_string(IOBuffer(), string('\\',"777"))
+
+# 11659
+# The indentation code was not correctly counting tab stops
+@test Base.indentation("      \t") == (8, true)
+@test Base.indentation("  \tfoob") == (8, false)
+@test Base.indentation(" \t \t")   == (16, true)
+
+@test Base.unindent("\tfoo",0) == "\tfoo"
+@test Base.unindent("\tfoo",4) == "    foo"
+@test Base.unindent("    \tfoo",4) == "    foo"
+@test Base.unindent("\t\n    \tfoo",4) == "    \n    foo"
+@test Base.unindent("\tfoo\tbar",4) == "    foo     bar"
+@test Base.unindent("\n\tfoo",4) == "\n    foo"
+@test Base.unindent("\n    \tfoo",4) == "\n    foo"
+@test Base.unindent("\n\t\n    \tfoo",4) == "\n    \n    foo"
+@test Base.unindent("\n\tfoo\tbar",4) == "\n    foo     bar"
+
+# Tests of raw_str macro
+@test raw"$" == "\$"
+@test raw"\n" == "\\n"
+@test raw"\t" == "\\t"
+
+s1 = raw"""
+     lorem ipsum\n
+     $x = 1$
+     """
+
+s2 = """
+     lorem ipsum\\n
+     \$x = 1\$
+     """
+
+@test s1 == s2
+
+# issue #22021, string realloc bug with join
+s22021 = String["\"\"\"
+     non_max_suppression(boxes, scores, max_output_size; iou_threshold=nothing)
+
+Greedily selects a subset of bounding boxes in descending order of score,
+
+pruning away boxes that have high intersection-over-union (IOU) overlap
+with previously selected boxes.  Bounding boxes are supplied as
+[y1, x1, y2, x2], where (y1, x1) and (y2, x2) are the coordinates of any
+diagonal pair of box corners and the coordinates can be provided as normalized
+(i.e., lying in the interval [0, 1]) or absolute.  Note that this algorithm
+is agnostic to where the origin is in the coordinate system.  Note that this
+algorithm is invariant to orthogonal transformations and translations
+of the coordinate system; thus translating or reflections of the coordinate
+system result in the same boxes being selected by the algorithm.
+
+The output of this operation is a set of integers indexing into the input
+collection of bounding boxes representing the selected boxes.  The bounding
+box coordinates corresponding to the selected indices can then be obtained
+using the `tf.gather operation`.  For example:
+
+  selected_indices = tf.image.non_max_suppression(
+      boxes, scores, max_output_size, iou_threshold)
+  selected_boxes = tf.gather(boxes, selected_indices)
+\"\"\"",
+    "    tf.@op function non_max_suppression(v13566, v13567, v13568; name=nothing, iou_threshold=nothing) ",
+    "            local desc ",
+    "            tf.with_op_name((()->begin  ",
+    "                        desc = tf.NodeDescription(\"NonMaxSuppression\") ",
+    "                        begin  ",
+    "                            begin  ",
+    "                                v13566 = convert(TensorFlow.Tensor{Float32}, v13566) ",
+    "                                begin  ",
+    "                                end",
+    "                            end",
+    "                            begin  ",
+    "                                v13567 = convert(TensorFlow.Tensor{Float32}, v13567) ",
+    "                                begin  ",
+    "                                end",
+    "                            end",
+    "                            begin  ",
+    "                                v13568 = convert(TensorFlow.Tensor{Int32}, v13568) ",
+    "                                begin  ",
+    "                                end",
+    "                            end",
+    "                        end ",
+    "                        begin  ",
+    "                            begin  ",
+    "                                tf.add_input(desc, v13566)",
+    "                            end",
+    "                            begin  ",
+    "                                tf.add_input(desc, v13567)",
+    "                            end",
+    "                            begin  ",
+    "                                tf.add_input(desc, v13568)",
+    "                            end",
+    "                        end ",
+    "                        begin  ",
+    "                            begin  ",
+    "                                if iou_threshold !== nothing ",
+    "                                    desc[\"iou_threshold\"] = Base.identity(iou_threshold)",
+    "                                end",
+    "                            end",
+    "                        end",
+    "                    end), name, \"NonMaxSuppression\") ",
+    "            tf.Tensor(tf.Operation(desc))",
+    "        end"]
+
+for i = 1:10
+    buf = IOBuffer()
+    print(buf, join(s22021, "\n"))
+    @test isvalid(String, take!(buf))
+end
@@ -0,0 +1,377 @@
+# This file is a part of Julia. License is MIT: https://julialang.org/license
+
+# some test strings
+astr = "Hello, world.\n"
+u8str = "∀ ε > 0, ∃ δ > 0: |x-y| < δ ⇒ |f(x)-f(y)| < ε"
+
+# I think these should give error on 4 also, and "" is not treated
+# consistently with SubString("",1,1), nor with Char[]
+for ind in (0, 5)
+    @test_throws BoundsError search("foo", SubString("",1,1), ind)
+    @test_throws BoundsError rsearch("foo", SubString("",1,1), ind)
+    @test_throws BoundsError searchindex("foo", SubString("",1,1), ind)
+    @test_throws BoundsError rsearchindex("foo", SubString("",1,1), ind)
+end
+
+# Note: the commented out tests will be enabled after fixes to make
+# sure that search/rsearch/searchindex/rsearchindex are consistent
+# no matter what type of AbstractString the second argument is
+@test_throws BoundsError search("foo", Char[], 0)
+@test_throws BoundsError search("foo", Char[], 5)
+# @test_throws BoundsError rsearch("foo", Char[], 0)
+@test_throws BoundsError rsearch("foo", Char[], 5)
+
+# @test_throws BoundsError searchindex("foo", Char[], 0)
+# @test_throws BoundsError searchindex("foo", Char[], 5)
+# @test_throws BoundsError rsearchindex("foo", Char[], 0)
+# @test_throws BoundsError rsearchindex("foo", Char[], 5)
+
+# @test_throws ErrorException in("foobar","bar")
+@test_throws BoundsError search(b"\x1\x2",0x1,0)
+@test rsearchindex(b"foo",b"o",0) == 0
+@test rsearchindex(SubString("",1,1),SubString("",1,1)) == 1
+
+@test search(b"foo",'o') == 2
+@test rsearch(b"foo",'o') == 3
+@test search(b"foó",'ó') == 3
+@test rsearch(b"foó",'ó') == 3
+
+# ascii search
+for str in [astr, GenericString(astr)]
+    @test_throws BoundsError search(str, 'z', 0)
+    @test_throws BoundsError search(str, '∀', 0)
+    @test search(str, 'x') == 0
+    @test search(str, '\0') == 0
+    @test search(str, '\u80') == 0
+    @test search(str, '∀') == 0
+    @test search(str, 'H') == 1
+    @test search(str, 'l') == 3
+    @test search(str, 'l', 4) == 4
+    @test search(str, 'l', 5) == 11
+    @test search(str, 'l', 12) == 0
+    @test search(str, ',') == 6
+    @test search(str, ',', 7) == 0
+    @test search(str, '\n') == 14
+    @test search(str, '\n', 15) == 0
+    @test_throws BoundsError search(str, 'ε', nextind(str,endof(str))+1)
+    @test_throws BoundsError search(str, 'a', nextind(str,endof(str))+1)
+end
+
+# ascii rsearch
+for str in [astr]
+    @test rsearch(str, 'x') == 0
+    @test rsearch(str, '\0') == 0
+    @test rsearch(str, '\u80') == 0
+    @test rsearch(str, '∀') == 0
+    @test rsearch(str, 'H') == 1
+    @test rsearch(str, 'H', 0) == 0
+    @test rsearch(str, 'l') == 11
+    @test rsearch(str, 'l', 5) == 4
+    @test rsearch(str, 'l', 4) == 4
+    @test rsearch(str, 'l', 3) == 3
+    @test rsearch(str, 'l', 2) == 0
+    @test rsearch(str, ',') == 6
+    @test rsearch(str, ',', 5) == 0
+    @test rsearch(str, '\n') == 14
+end
+
+# utf-8 search
+for str in (u8str, GenericString(u8str))
+    @test_throws BoundsError search(str, 'z', 0)
+    @test_throws BoundsError search(str, '∀', 0)
+    @test search(str, 'z') == 0
+    @test search(str, '\0') == 0
+    @test search(str, '\u80') == 0
+    @test search(str, '∄') == 0
+    @test search(str, '∀') == 1
+    @test_throws UnicodeError search(str, '∀', 2)
+    @test search(str, '∀', 4) == 0
+    @test search(str, '∃') == 13
+    @test_throws UnicodeError search(str, '∃', 15)
+    @test search(str, '∃', 16) == 0
+    @test search(str, 'x') == 26
+    @test search(str, 'x', 27) == 43
+    @test search(str, 'x', 44) == 0
+    @test search(str, 'δ') == 17
+    @test_throws UnicodeError search(str, 'δ', 18)
+    @test search(str, 'δ', nextind(str,17)) == 33
+    @test search(str, 'δ', nextind(str,33)) == 0
+    @test search(str, 'ε') == 5
+    @test search(str, 'ε', nextind(str,5)) == 54
+    @test search(str, 'ε', nextind(str,54)) == 0
+    @test search(str, 'ε', nextind(str,endof(str))) == 0
+    @test search(str, 'a', nextind(str,endof(str))) == 0
+    @test_throws BoundsError search(str, 'ε', nextind(str,endof(str))+1)
+    @test_throws BoundsError search(str, 'a', nextind(str,endof(str))+1)
+end
+
+# utf-8 rsearch
+for str in [u8str]
+    @test rsearch(str, 'z') == 0
+    @test rsearch(str, '\0') == 0
+    @test rsearch(str, '\u80') == 0
+    @test rsearch(str, '∄') == 0
+    @test rsearch(str, '∀') == 1
+    @test rsearch(str, '∀', 0) == 0
+    @test rsearch(str, '∃') == 13
+    @test rsearch(str, '∃', 14) == 13
+    @test rsearch(str, '∃', 13) == 13
+    @test rsearch(str, '∃', 12) == 0
+    @test rsearch(str, 'x') == 43
+    @test rsearch(str, 'x', 42) == 26
+    @test rsearch(str, 'x', 25) == 0
+    @test rsearch(str, 'δ') == 33
+    @test rsearch(str, 'δ', 32) == 17
+    @test rsearch(str, 'δ', 16) == 0
+    @test rsearch(str, 'ε') == 54
+    @test rsearch(str, 'ε', 53) == 5
+    @test rsearch(str, 'ε', 4) == 0
+end
+
+# string search with a single-char string
+@test search(astr, "x") == 0:-1
+@test search(astr, "H") == 1:1
+@test search(astr, "H", 2) == 0:-1
+@test search(astr, "l") == 3:3
+@test search(astr, "l", 4) == 4:4
+@test search(astr, "l", 5) == 11:11
+@test search(astr, "l", 12) == 0:-1
+@test search(astr, "\n") == 14:14
+@test search(astr, "\n", 15) == 0:-1
+
+@test search(u8str, "z") == 0:-1
+@test search(u8str, "∄") == 0:-1
+@test search(u8str, "∀") == 1:1
+@test search(u8str, "∀", 4) == 0:-1
+@test search(u8str, "∃") == 13:13
+@test search(u8str, "∃", 16) == 0:-1
+@test search(u8str, "x") == 26:26
+@test search(u8str, "x", 27) == 43:43
+@test search(u8str, "x", 44) == 0:-1
+@test search(u8str, "ε") == 5:5
+@test search(u8str, "ε", 7) == 54:54
+@test search(u8str, "ε", 56) == 0:-1
+
+# string rsearch with a single-char string
+@test rsearch(astr, "x") == 0:-1
+@test rsearch(astr, "H") == 1:1
+@test rsearch(astr, "H", 2) == 1:1
+@test rsearch(astr, "H", 0) == 0:-1
+@test rsearch(astr, "l") == 11:11
+@test rsearch(astr, "l", 10) == 4:4
+@test rsearch(astr, "l", 4) == 4:4
+@test rsearch(astr, "l", 3) == 3:3
+@test rsearch(astr, "l", 2) == 0:-1
+@test rsearch(astr, "\n") == 14:14
+@test rsearch(astr, "\n", 13) == 0:-1
+
+@test rsearch(u8str, "z") == 0:-1
+@test rsearch(u8str, "∄") == 0:-1
+@test rsearch(u8str, "∀") == 1:1
+@test rsearch(u8str, "∀", 0) == 0:-1
+#TODO: setting the limit in the middle of a wide char
+#      makes search fail but rsearch succeed.
+#      Should rsearch fail as well?
+#@test rsearch(u8str, "∀", 2) == 0:-1 # gives 1:3
+@test rsearch(u8str, "∃") == 13:13
+@test rsearch(u8str, "∃", 12) == 0:-1
+@test rsearch(u8str, "x") == 43:43
+@test rsearch(u8str, "x", 42) == 26:26
+@test rsearch(u8str, "x", 25) == 0:-1
+@test rsearch(u8str, "ε") == 54:54
+@test rsearch(u8str, "ε", 53) == 5:5
+@test rsearch(u8str, "ε", 4) == 0:-1
+
+# string search with a single-char regex
+@test search(astr, r"x") == 0:-1
+@test search(astr, r"H") == 1:1
+@test search(astr, r"H", 2) == 0:-1
+@test search(astr, r"l") == 3:3
+@test search(astr, r"l", 4) == 4:4
+@test search(astr, r"l", 5) == 11:11
+@test search(astr, r"l", 12) == 0:-1
+@test search(astr, r"\n") == 14:14
+@test search(astr, r"\n", 15) == 0:-1
+@test search(u8str, r"z") == 0:-1
+@test search(u8str, r"∄") == 0:-1
+@test search(u8str, r"∀") == 1:1
+@test search(u8str, r"∀", 4) == 0:-1
+@test search(u8str, r"∀") == search(u8str, r"\u2200")
+@test search(u8str, r"∀", 4) == search(u8str, r"\u2200", 4)
+@test search(u8str, r"∃") == 13:13
+@test search(u8str, r"∃", 16) == 0:-1
+@test search(u8str, r"x") == 26:26
+@test search(u8str, r"x", 27) == 43:43
+@test search(u8str, r"x", 44) == 0:-1
+@test search(u8str, r"ε") == 5:5
+@test search(u8str, r"ε", 7) == 54:54
+@test search(u8str, r"ε", 56) == 0:-1
+for i = 1:endof(astr)
+    @test search(astr, r"."s, i) == i:i
+end
+for i = 1:endof(u8str)
+    if isvalid(u8str,i)
+        @test search(u8str, r"."s, i) == i:i
+    end
+end
+
+# string search with a zero-char string
+for i = 1:endof(astr)
+    @test search(astr, "", i) == i:i-1
+end
+for i = 1:endof(u8str)
+    @test search(u8str, "", i) == i:i-1
+end
+@test search("", "") == 1:0
+
+# string rsearch with a zero-char string
+for i = 1:endof(astr)
+    @test rsearch(astr, "", i) == i:i-1
+end
+for i = 1:endof(u8str)
+    @test rsearch(u8str, "", i) == i:i-1
+end
+@test rsearch("", "") == 1:0
+
+# string search with a zero-char regex
+for i = 1:endof(astr)
+    @test search(astr, r"", i) == i:i-1
+end
+for i = 1:endof(u8str)
+    # TODO: should regex search fast-forward invalid indices?
+    if isvalid(u8str,i)
+        @test search(u8str, r""s, i) == i:i-1
+    end
+end
+
+# string search with a two-char string literal
+@test search("foo,bar,baz", "xx") == 0:-1
+@test search("foo,bar,baz", "fo") == 1:2
+@test search("foo,bar,baz", "fo", 3) == 0:-1
+@test search("foo,bar,baz", "oo") == 2:3
+@test search("foo,bar,baz", "oo", 4) == 0:-1
+@test search("foo,bar,baz", "o,") == 3:4
+@test search("foo,bar,baz", "o,", 5) == 0:-1
+@test search("foo,bar,baz", ",b") == 4:5
+@test search("foo,bar,baz", ",b", 6) == 8:9
+@test search("foo,bar,baz", ",b", 10) == 0:-1
+@test search("foo,bar,baz", "az") == 10:11
+@test search("foo,bar,baz", "az", 12) == 0:-1
+
+# issue #9365
+# string search with a two-char UTF-8 (2 byte) string literal
+@test search("ééé", "éé") == 1:3
+@test search("ééé", "éé", 1) == 1:3
+# string search with a two-char UTF-8 (3 byte) string literal
+@test search("€€€", "€€") == 1:4
+@test search("€€€", "€€", 1) == 1:4
+# string search with a two-char UTF-8 (4 byte) string literal
+@test search("\U1f596\U1f596\U1f596", "\U1f596\U1f596") == 1:5
+@test search("\U1f596\U1f596\U1f596", "\U1f596\U1f596", 1) == 1:5
+
+# string search with a two-char UTF-8 (2 byte) string literal
+@test search("éé", "éé") == 1:3
+@test search("éé", "éé", 1) == 1:3
+# string search with a two-char UTF-8 (3 byte) string literal
+@test search("€€", "€€") == 1:4
+@test search("€€", "€€", 1) == 1:4
+# string search with a two-char UTF-8 (4 byte) string literal
+@test search("\U1f596\U1f596", "\U1f596\U1f596") == 1:5
+@test search("\U1f596\U1f596", "\U1f596\U1f596", 1) == 1:5
+
+# string rsearch with a two-char UTF-8 (2 byte) string literal
+@test rsearch("ééé", "éé") == 3:5
+@test rsearch("ééé", "éé", endof("ééé")) == 3:5
+# string rsearch with a two-char UTF-8 (3 byte) string literal
+@test rsearch("€€€", "€€") == 4:7
+@test rsearch("€€€", "€€", endof("€€€")) == 4:7
+# string rsearch with a two-char UTF-8 (4 byte) string literal
+@test rsearch("\U1f596\U1f596\U1f596", "\U1f596\U1f596") == 5:9
+@test rsearch("\U1f596\U1f596\U1f596", "\U1f596\U1f596", endof("\U1f596\U1f596\U1f596")) == 5:9
+
+# string rsearch with a two-char UTF-8 (2 byte) string literal
+@test rsearch("éé", "éé") == 1:3        # should really be 1:4!
+@test rsearch("éé", "éé", endof("ééé")) == 1:3
+# string search with a two-char UTF-8 (3 byte) string literal
+@test rsearch("€€", "€€") == 1:4        # should really be 1:6!
+@test rsearch("€€", "€€", endof("€€€")) == 1:4
+# string search with a two-char UTF-8 (4 byte) string literal
+@test rsearch("\U1f596\U1f596", "\U1f596\U1f596") == 1:5        # should really be 1:8!
+@test rsearch("\U1f596\U1f596", "\U1f596\U1f596", endof("\U1f596\U1f596\U1f596")) == 1:5
+
+# string rsearch with a two-char string literal
+@test rsearch("foo,bar,baz", "xx") == 0:-1
+@test rsearch("foo,bar,baz", "fo") == 1:2
+@test rsearch("foo,bar,baz", "fo", 1) == 0:-1
+@test rsearch("foo,bar,baz", "oo") == 2:3
+@test rsearch("foo,bar,baz", "oo", 2) == 0:-1
+@test rsearch("foo,bar,baz", "o,") == 3:4
+@test rsearch("foo,bar,baz", "o,", 1) == 0:-1
+@test rsearch("foo,bar,baz", ",b") == 8:9
+@test rsearch("foo,bar,baz", ",b", 6) == 4:5
+@test rsearch("foo,bar,baz", ",b", 3) == 0:-1
+@test rsearch("foo,bar,baz", "az") == 10:11
+@test rsearch("foo,bar,baz", "az", 10) == 0:-1
+
+# array rsearch
+@test rsearch(UInt8[1,2,3],UInt8[2,3],3) == 2:3
+@test rsearch(UInt8[1,2,3],UInt8[2,3],1) == 0:-1
+
+# string search with a two-char regex
+@test search("foo,bar,baz", r"xx") == 0:-1
+@test search("foo,bar,baz", r"fo") == 1:2
+@test search("foo,bar,baz", r"fo", 3) == 0:-1
+@test search("foo,bar,baz", r"oo") == 2:3
+@test search("foo,bar,baz", r"oo", 4) == 0:-1
+@test search("foo,bar,baz", r"o,") == 3:4
+@test search("foo,bar,baz", r"o,", 5) == 0:-1
+@test search("foo,bar,baz", r",b") == 4:5
+@test search("foo,bar,baz", r",b", 6) == 8:9
+@test search("foo,bar,baz", r",b", 10) == 0:-1
+@test search("foo,bar,baz", r"az") == 10:11
+@test search("foo,bar,baz", r"az", 12) == 0:-1
+
+@test searchindex("foo", 'o') == 2
+@test searchindex("foo", 'o', 3) == 3
+
+# string searchindex with a two-char UTF-8 (2 byte) string literal
+@test searchindex("ééé", "éé") == 1
+@test searchindex("ééé", "éé", 1) == 1
+# string searchindex with a two-char UTF-8 (3 byte) string literal
+@test searchindex("€€€", "€€") == 1
+@test searchindex("€€€", "€€", 1) == 1
+# string searchindex with a two-char UTF-8 (4 byte) string literal
+@test searchindex("\U1f596\U1f596\U1f596", "\U1f596\U1f596") == 1
+@test searchindex("\U1f596\U1f596\U1f596", "\U1f596\U1f596", 1) == 1
+
+# string searchindex with a two-char UTF-8 (2 byte) string literal
+@test searchindex("éé", "éé") == 1
+@test searchindex("éé", "éé", 1) == 1
+# string searchindex with a two-char UTF-8 (3 byte) string literal
+@test searchindex("€€", "€€") == 1
+@test searchindex("€€", "€€", 1) == 1
+# string searchindex with a two-char UTF-8 (4 byte) string literal
+@test searchindex("\U1f596\U1f596", "\U1f596\U1f596") == 1
+@test searchindex("\U1f596\U1f596", "\U1f596\U1f596", 1) == 1
+
+# string rsearchindex with a two-char UTF-8 (2 byte) string literal
+@test rsearchindex("ééé", "éé") == 3
+@test rsearchindex("ééé", "éé", endof("ééé")) == 3
+# string rsearchindex with a two-char UTF-8 (3 byte) string literal
+@test rsearchindex("€€€", "€€") == 4
+@test rsearchindex("€€€", "€€", endof("€€€")) == 4
+# string rsearchindex with a two-char UTF-8 (4 byte) string literal
+@test rsearchindex("\U1f596\U1f596\U1f596", "\U1f596\U1f596") == 5
+@test rsearchindex("\U1f596\U1f596\U1f596", "\U1f596\U1f596", endof("\U1f596\U1f596\U1f596")) == 5
+
+# string rsearchindex with a two-char UTF-8 (2 byte) string literal
+@test rsearchindex("éé", "éé") == 1
+@test rsearchindex("éé", "éé", endof("ééé")) == 1
+# string searchindex with a two-char UTF-8 (3 byte) string literal
+@test rsearchindex("€€", "€€") == 1
+@test rsearchindex("€€", "€€", endof("€€€")) == 1
+# string searchindex with a two-char UTF-8 (4 byte) string literal
+@test rsearchindex("\U1f596\U1f596", "\U1f596\U1f596") == 1
+@test rsearchindex("\U1f596\U1f596", "\U1f596\U1f596", endof("\U1f596\U1f596\U1f596")) == 1
+
+@test_throws ErrorException "ab" ∈ "abc"
@@ -0,0 +1,212 @@
+# This file is a part of Julia. License is MIT: https://julialang.org/license
+
+## SubString, RevString and Cstring tests ##
+
+## SubString tests ##
+u8str = "∀ ε > 0, ∃ δ > 0: |x-y| < δ ⇒ |f(x)-f(y)| < ε"
+u8str2 = u8str^2
+len_u8str = length(u8str)
+slen_u8str = length(u8str)
+len_u8str2 = length(u8str2)
+slen_u8str2 = length(u8str2)
+
+@test len_u8str2 == 2 * len_u8str
+@test slen_u8str2 == 2 * slen_u8str
+
+u8str2plain = String(u8str2)
+
+for i1 = 1:length(u8str2)
+    if !isvalid(u8str2, i1); continue; end
+    for i2 = i1:length(u8str2)
+        if !isvalid(u8str2, i2); continue; end
+        @test length(u8str2[i1:i2]) == length(u8str2plain[i1:i2])
+        @test length(u8str2[i1:i2]) == length(u8str2plain[i1:i2])
+        @test u8str2[i1:i2] == u8str2plain[i1:i2]
+    end
+end
+
+str="tempus fugit"              #length(str)==12
+ss=SubString(str,1,length(str)) #match source string
+@test length(ss)==length(str)
+
+ss=SubString(str,1,0)    #empty SubString
+@test length(ss)==0
+
+ss=SubString(str,14,20)  #start indexed beyond source string length
+@test length(ss)==0
+
+ss=SubString(str,10,16)  #end indexed beyond source string length
+@test length(ss)==3
+
+str2=""
+ss=SubString(str2,1,4)  #empty source string
+@test length(ss)==0
+
+ss=SubString(str2,1,1)  #empty source string, identical start and end index
+@test length(ss)==0
+
+@test SubString("foobar",big(1),big(3)) == "foo"
+
+str = "aa\u2200\u2222bb"
+u = SubString(str, 3, 6)
+@test length(u)==2
+b = IOBuffer()
+write(b, u)
+@test String(take!(b)) == "\u2200\u2222"
+
+@test_throws ArgumentError SubString(str, 4, 5)
+@test_throws BoundsError next(u, 0)
+@test_throws BoundsError next(u, 7)
+@test_throws BoundsError getindex(u, 0)
+@test_throws BoundsError getindex(u, 7)
+@test_throws BoundsError getindex(u, 0:1)
+@test_throws BoundsError getindex(u, 7:7)
+@test reverseind(u, 1) == 4
+@test typeof(Base.cconvert(Ptr{Int8},u)) == SubString{String}
+@test Base.cconvert(Ptr{Int8},u) == u
+
+str = "føøbar"
+u = SubString(str, 4, 3)
+@test length(u)==0
+b = IOBuffer()
+write(b, u)
+@test String(take!(b)) == ""
+
+str = "føøbar"
+u = SubString(str, 10, 10)
+@test length(u)==0
+b = IOBuffer()
+write(b, u)
+@test String(take!(b)) == ""
+
+# search and SubString (issue #5679)
+str = "Hello, world!"
+u = SubString(str, 1, 5)
+@test rsearch(u, "World") == 0:-1
+@test rsearch(u, 'z') == 0
+@test rsearch(u, "ll") == 3:4
+
+# sizeof
+@test sizeof(SubString("abc\u2222def",4,4)) == 3
+
+# issue #3710
+@test prevind(SubString("{var}",2,4),4) == 3
+
+# issue #4183
+@test split(SubString("x", 2, 0), "y") == AbstractString[""]
+
+# issue #6772
+@test float(SubString("10",1,1)) === 1.0
+@test float(SubString("1 0",1,1)) === 1.0
+@test parse(Float32,SubString("10",1,1)) === 1.0f0
+
+# issue #5870
+@test !ismatch(Regex("aa"), SubString("",1,0))
+@test ismatch(Regex(""), SubString("",1,0))
+
+# isvalid(), chr2ind() and ind2chr() for SubString{DirectIndexString}
+let s="lorem ipsum",
+    sdict=Dict(SubString(s,1,11)=>s,
+               SubString(s,1,6)=>"lorem ",
+               SubString(s,1,0)=>"",
+               SubString(s,2,4)=>"ore",
+               SubString(s,2,16)=>"orem ipsum",
+               SubString(s,12,14)=>""
+               )
+    for (ss,s) in sdict
+        for i in -1:12
+            @test isvalid(ss,i)==isvalid(s,i)
+        end
+    end
+    for (ss,s) in sdict
+        for i in 1:length(ss)
+            @test ind2chr(ss,i)==ind2chr(s,i)
+        end
+    end
+    for (ss,s) in sdict
+        for i in 1:length(ss)
+            @test chr2ind(ss,i)==chr2ind(s,i)
+        end
+    end
+end #let
+
+#for isvalid(SubString{String})
+let s = "Σx + βz - 2"
+  for i in -1:length(s)+2
+      ss=SubString(s,1,i)
+      @test isvalid(ss,i)==isvalid(s,i)
+  end
+end
+
+ss=SubString("hello",1,5)
+@test_throws BoundsError ind2chr(ss, -1)
+@test_throws BoundsError chr2ind(ss, -1)
+@test_throws BoundsError chr2ind(ss, 10)
+@test_throws BoundsError ind2chr(ss, 10)
+
+# length(SubString{String}) performance specialization
+let s = "|η(α)-ϕ(κ)| < ε"
+    @test length(SubString(s,1,0))==length(s[1:0])
+    @test length(SubString(s,4,4))==length(s[4:4])
+    @test length(SubString(s,1,7))==length(s[1:7])
+    @test length(SubString(s,4,11))==length(s[4:11])
+end
+
+## Reverse strings ##
+
+rs = RevString("foobar")
+@test length(rs) == 6
+@test sizeof(rs) == 6
+@test isascii(rs)
+
+# issue #4586
+@test rsplit(RevString("ailuj"),'l') == ["ju","ia"]
+@test parse(Float64,RevString("64")) === 46.0
+
+# reverseind
+for T in (String, GenericString)
+    for prefix in ("", "abcd", "\U0001d6a4\U0001d4c1", "\U0001d6a4\U0001d4c1c", " \U0001d6a4\U0001d4c1")
+        for suffix in ("", "abcde", "\U0001d4c1β\U0001d6a4", "\U0001d4c1β\U0001d6a4c", " \U0001d4c1β\U0001d6a4")
+            for c in ('X', 'δ', '\U0001d6a5')
+                s = convert(T, string(prefix, c, suffix))
+                r = reverse(s)
+                ri = search(r, c)
+                @test r == RevString(s)
+                @test c == s[reverseind(s, ri)] == r[ri]
+                s = RevString(s)
+                r = reverse(s)
+                ri = search(r, c)
+                @test c == s[reverseind(s, ri)] == r[ri]
+                s = convert(T, string(prefix, prefix, c, suffix, suffix))
+                pre = convert(T, prefix)
+                sb = SubString(s, nextind(pre, endof(pre)), endof(convert(T, string(prefix, prefix, c, suffix))))
+                r = reverse(sb)
+                ri = search(r, c)
+                @test c == sb[reverseind(sb, ri)] == r[ri]
+            end
+        end
+    end
+end
+
+## Cstring tests ##
+
+# issue #13974: comparison against pointers
+
+str = String("foobar")
+ptr = pointer(str)
+cstring = Cstring(ptr)
+@test ptr == cstring
+@test cstring == ptr
+
+# convenient NULL string creation from Ptr{Void}
+nullstr = Cstring(C_NULL)
+
+# Comparisons against NULL strings
+@test ptr != nullstr
+@test nullstr != ptr
+
+# Short-hand comparison against C_NULL
+@test nullstr == C_NULL
+@test C_NULL == nullstr
+@test cstring != C_NULL
+@test C_NULL != cstring
@@ -0,0 +1,237 @@
+# This file is a part of Julia. License is MIT: https://julialang.org/license
+
+# padding (lpad and rpad)
+@test lpad("foo", 3) == "foo"
+@test rpad("foo", 3) == "foo"
+@test lpad("foo", 5) == "  foo"
+@test rpad("foo", 5) == "foo  "
+@test lpad("foo", 5, "  ") == "  foo"
+@test rpad("foo", 5, "  ") == "foo  "
+@test lpad("foo", 6, "  ") == "   foo"
+@test rpad("foo", 6, "  ") == "foo   "
+
+# string manipulation
+@test strip("") == ""
+@test strip(" ") == ""
+@test strip("  ") == ""
+@test strip("   ") == ""
+@test strip("\t  hi   \n") == "hi"
+@test strip("foobarfoo", ['f','o']) == "bar"
+@test strip("foobarfoo", ('f','o')) == "bar"
+
+for s in ("", " ", " abc", "abc ", "  abc  "), f in (lstrip, rstrip, strip)
+    fs = f(s)
+    for T = (String, GenericString)
+        t = convert(T,s)
+        ft = f(t)
+        @test s == t
+        @test fs == ft
+        @test typeof(ft) == typeof(t[1:end])
+
+        b = convert(SubString{T}, t)
+        fb = f(b)
+        @test s == b
+        @test fs == fb
+        @test typeof(fb) == SubString{T}
+    end
+end
+
+# split
+@test isequal(split("foo,bar,baz", 'x'), ["foo,bar,baz"])
+@test isequal(split("foo,bar,baz", ','), ["foo","bar","baz"])
+@test isequal(split("foo,bar,baz", ","), ["foo","bar","baz"])
+@test isequal(split("foo,bar,baz", r","), ["foo","bar","baz"])
+@test isequal(split("foo,bar,baz", ','; limit=0), ["foo","bar","baz"])
+@test isequal(split("foo,bar,baz", ','; limit=1), ["foo,bar,baz"])
+@test isequal(split("foo,bar,baz", ','; limit=2), ["foo","bar,baz"])
+@test isequal(split("foo,bar,baz", ','; limit=3), ["foo","bar","baz"])
+@test isequal(split("foo,bar", "o,b"), ["fo","ar"])
+
+@test isequal(split("", ','), [""])
+@test isequal(split(",", ','), ["",""])
+@test isequal(split(",,", ','), ["","",""])
+@test isequal(split("", ','  ; keep=false), [])
+@test isequal(split(",", ',' ; keep=false), [])
+@test isequal(split(",,", ','; keep=false), [])
+
+@test isequal(split("a b c"), ["a","b","c"])
+@test isequal(split("a  b \t c\n"), ["a","b","c"])
+
+@test isequal(rsplit("foo,bar,baz", 'x'), ["foo,bar,baz"])
+@test isequal(rsplit("foo,bar,baz", ','), ["foo","bar","baz"])
+@test isequal(rsplit("foo,bar,baz", ","), ["foo","bar","baz"])
+@test isequal(rsplit("foo,bar,baz", ','; limit=0), ["foo","bar","baz"])
+@test isequal(rsplit("foo,bar,baz", ','; limit=1), ["foo,bar,baz"])
+@test isequal(rsplit("foo,bar,baz", ','; limit=2), ["foo,bar","baz"])
+@test isequal(rsplit("foo,bar,baz", ','; limit=3), ["foo","bar","baz"])
+@test isequal(rsplit("foo,bar", "o,b"), ["fo","ar"])
+
+@test isequal(rsplit("", ','), [""])
+@test isequal(rsplit(",", ','), ["",""])
+@test isequal(rsplit(",,", ','), ["","",""])
+@test isequal(rsplit(",,", ','; limit=2), [",",""])
+@test isequal(rsplit("", ','  ; keep=false), [])
+@test isequal(rsplit(",", ',' ; keep=false), [])
+@test isequal(rsplit(",,", ','; keep=false), [])
+
+#@test isequal(rsplit("a b c"), ["a","b","c"])
+#@test isequal(rsplit("a  b \t c\n"), ["a","b","c"])
+
+let str = "a.:.ba..:..cba.:.:.dcba.:."
+@test isequal(split(str, ".:."), ["a","ba.",".cba",":.dcba",""])
+@test isequal(split(str, ".:."; keep=false), ["a","ba.",".cba",":.dcba"])
+@test isequal(split(str, ".:."), ["a","ba.",".cba",":.dcba",""])
+@test isequal(split(str, r"\.(:\.)+"), ["a","ba.",".cba","dcba",""])
+@test isequal(split(str, r"\.(:\.)+"; keep=false), ["a","ba.",".cba","dcba"])
+@test isequal(split(str, r"\.+:\.+"), ["a","ba","cba",":.dcba",""])
+@test isequal(split(str, r"\.+:\.+"; keep=false), ["a","ba","cba",":.dcba"])
+
+@test isequal(rsplit(str, ".:."), ["a","ba.",".cba.:","dcba",""])
+@test isequal(rsplit(str, ".:."; keep=false), ["a","ba.",".cba.:","dcba"])
+@test isequal(rsplit(str, ".:."; limit=2), ["a.:.ba..:..cba.:.:.dcba", ""])
+@test isequal(rsplit(str, ".:."; limit=3), ["a.:.ba..:..cba.:", "dcba", ""])
+@test isequal(rsplit(str, ".:."; limit=4), ["a.:.ba.", ".cba.:", "dcba", ""])
+@test isequal(rsplit(str, ".:."; limit=5), ["a", "ba.", ".cba.:", "dcba", ""])
+@test isequal(rsplit(str, ".:."; limit=6), ["a", "ba.", ".cba.:", "dcba", ""])
+end
+
+# zero-width splits
+@test isequal(rsplit("", ""), [""])
+
+@test isequal(split("", ""), [""])
+@test isequal(split("", r""), [""])
+@test isequal(split("abc", ""), ["a","b","c"])
+@test isequal(split("abc", r""), ["a","b","c"])
+@test isequal(split("abcd", r"b?"), ["a","c","d"])
+@test isequal(split("abcd", r"b*"), ["a","c","d"])
+@test isequal(split("abcd", r"b+"), ["a","cd"])
+@test isequal(split("abcd", r"b?c?"), ["a","d"])
+@test isequal(split("abcd", r"[bc]?"), ["a","","d"])
+@test isequal(split("abcd", r"a*"), ["","b","c","d"])
+@test isequal(split("abcd", r"a+"), ["","bcd"])
+@test isequal(split("abcd", r"d*"), ["a","b","c",""])
+@test isequal(split("abcd", r"d+"), ["abc",""])
+@test isequal(split("abcd", r"[ad]?"), ["","b","c",""])
+
+# replace
+@test replace("\u2202", '*', '\0') == "\u2202"
+
+@test replace("foobar", 'o', '0') == "f00bar"
+@test replace("foobar", 'o', '0', 1) == "f0obar"
+@test replace("foobar", 'o', "") == "fbar"
+@test replace("foobar", 'o', "", 1) == "fobar"
+@test replace("foobar", 'f', 'F') == "Foobar"
+@test replace("foobar", 'r', 'R') == "foobaR"
+
+@test replace("foofoofoo", "foo", "bar") == "barbarbar"
+@test replace("foobarfoo", "foo", "baz") == "bazbarbaz"
+@test replace("barfoofoo", "foo", "baz") == "barbazbaz"
+
+@test replace("", "", "") == ""
+@test replace("", "", "x") == "x"
+@test replace("", "x", "y") == ""
+
+@test replace("abcd", "", "^") == "^a^b^c^d^"
+@test replace("abcd", "b", "^") == "a^cd"
+@test replace("abcd", r"b?", "^") == "^a^c^d^"
+@test replace("abcd", r"b+", "^") == "a^cd"
+@test replace("abcd", r"b?c?", "^") == "^a^d^"
+@test replace("abcd", r"[bc]?", "^") == "^a^^d^"
+
+@test replace("foobarfoo", r"(fo|ba)", "xx") == "xxoxxrxxo"
+@test replace("foobarfoo", r"(foo|ba)", "bar") == "barbarrbar"
+
+@test replace("foobar", 'o', 'ø') == "føøbar"
+@test replace("foobar", 'o', 'ø', 1) == "føobar"
+@test replace("føøbar", 'ø', 'o') == "foobar"
+@test replace("føøbar", 'ø', 'o', 1) == "foøbar"
+@test replace("føøbar", 'ø', 'ö') == "fööbar"
+@test replace("føøbar", 'ø', 'ö', 1) == "föøbar"
+@test replace("føøbar", 'ø', "") == "fbar"
+@test replace("føøbar", 'ø', "", 1) == "føbar"
+@test replace("føøbar", 'f', 'F') == "Føøbar"
+@test replace("ḟøøbar", 'ḟ', 'F') == "Føøbar"
+@test replace("føøbar", 'f', 'Ḟ') == "Ḟøøbar"
+@test replace("ḟøøbar", 'ḟ', 'Ḟ') == "Ḟøøbar"
+@test replace("føøbar", 'r', 'R') == "føøbaR"
+@test replace("føøbaṙ", 'ṙ', 'R') == "føøbaR"
+@test replace("føøbar", 'r', 'Ṙ') == "føøbaṘ"
+@test replace("føøbaṙ", 'ṙ', 'Ṙ') == "føøbaṘ"
+
+@test replace("ḟøøḟøøḟøø", "ḟøø", "bar") == "barbarbar"
+@test replace("ḟøøbarḟøø", "ḟøø", "baz") == "bazbarbaz"
+@test replace("barḟøøḟøø", "ḟøø", "baz") == "barbazbaz"
+
+@test replace("foofoofoo", "foo", "ƀäṙ") == "ƀäṙƀäṙƀäṙ"
+@test replace("fooƀäṙfoo", "foo", "baz") == "bazƀäṙbaz"
+@test replace("ƀäṙfoofoo", "foo", "baz") == "ƀäṙbazbaz"
+
+@test replace("foofoofoo", "foo", "bar") == "barbarbar"
+@test replace("foobarfoo", "foo", "ƀäż") == "ƀäżbarƀäż"
+@test replace("barfoofoo", "foo", "ƀäż") == "barƀäżƀäż"
+
+@test replace("ḟøøḟøøḟøø", "ḟøø", "ƀäṙ") == "ƀäṙƀäṙƀäṙ"
+@test replace("ḟøøƀäṙḟøø", "ḟøø", "baz") == "bazƀäṙbaz"
+@test replace("ƀäṙḟøøḟøø", "ḟøø", "baz") == "ƀäṙbazbaz"
+
+@test replace("ḟøøḟøøḟøø", "ḟøø", "bar") == "barbarbar"
+@test replace("ḟøøbarḟøø", "ḟøø", "ƀäż") == "ƀäżbarƀäż"
+@test replace("barḟøøḟøø", "ḟøø", "ƀäż") == "barƀäżƀäż"
+
+@test replace("ḟøøḟøøḟøø", "ḟøø", "ƀäṙ") == "ƀäṙƀäṙƀäṙ"
+@test replace("ḟøøƀäṙḟøø", "ḟøø", "ƀäż") == "ƀäżƀäṙƀäż"
+@test replace("ƀäṙḟøøḟøø", "ḟøø", "ƀäż") == "ƀäṙƀäżƀäż"
+
+@test replace("", "", "ẍ") == "ẍ"
+@test replace("", "ẍ", "ÿ") == ""
+
+@test replace("äƀçđ", "", "π") == "πäπƀπçπđπ"
+@test replace("äƀçđ", "ƀ", "π") == "äπçđ"
+@test replace("äƀçđ", r"ƀ?", "π") == "πäπçπđπ"
+@test replace("äƀçđ", r"ƀ+", "π") == "äπçđ"
+@test replace("äƀçđ", r"ƀ?ç?", "π") == "πäπđπ"
+@test replace("äƀçđ", r"[ƀç]?", "π") == "πäππđπ"
+
+@test replace("foobarfoo", r"(fo|ba)", "ẍẍ") == "ẍẍoẍẍrẍẍo"
+
+@test replace("ḟøøbarḟøø", r"(ḟø|ba)", "xx") == "xxøxxrxxø"
+@test replace("ḟøøbarḟøø", r"(ḟøø|ba)", "bar") == "barbarrbar"
+
+@test replace("fooƀäṙfoo", r"(fo|ƀä)", "xx") == "xxoxxṙxxo"
+@test replace("fooƀäṙfoo", r"(foo|ƀä)", "ƀäṙ") == "ƀäṙƀäṙṙƀäṙ"
+
+@test replace("ḟøøƀäṙḟøø", r"(ḟø|ƀä)", "xx") == "xxøxxṙxxø"
+@test replace("ḟøøƀäṙḟøø", r"(ḟøø|ƀä)", "ƀäṙ") == "ƀäṙƀäṙṙƀäṙ"
+
+@test replace("foo", "oo", uppercase) == "fOO"
+
+# Issue 13332
+@test replace("abc", 'b', 2.1) == "a2.1c"
+
+# chomp/chop
+@test chomp("foo\n") == "foo"
+@test chop("fooε") == "foo"
+@test isa(chomp("foo"), SubString)
+@test isa(chop("foo"), SubString)
+
+# bytes2hex and hex2bytes
+hex_str = "d7a8fbb307d7809469ca9abcb0082e4f8d5651e46d3cdb762d02d0bf37c9e592"
+bin_val = hex2bytes(hex_str)
+
+@test div(length(hex_str), 2) == length(bin_val)
+@test hex_str == bytes2hex(bin_val)
+
+bin_val = hex2bytes("07bf")
+@test bin_val[1] == 7
+@test bin_val[2] == 191
+@test typeof(bin_val) == Array{UInt8, 1}
+@test length(bin_val) == 2
+
+# all valid hex chars
+@test "0123456789abcdefabcdef" == bytes2hex(hex2bytes("0123456789abcdefABCDEF"))
+
+# odd size
+@test_throws ArgumentError hex2bytes("0123456789abcdefABCDEF0")
+
+#non-hex characters
+@test_throws ArgumentError hex2bytes("0123456789abcdefABCDEFGH")