| 1 | 
  
    ## oils_failures_allowed: 1
   | 
  | 2 | 
  
    
   | 
  | 3 | 
  
    
   | 
  | 4 | 
  
    
   | 
  | 5 | 
  
    source $REPO_ROOT/spec/testdata/unicode.sh
   | 
  | 6 | 
  
    
   | 
  | 7 | 
  
    # bash agrees
   | 
  | 8 | 
  
    echo "farmer scalars =" ${#farmer}
   | 
  | 9 | 
  
    
   | 
  | 10 | 
  
    echo "facepalm scalars =" ${#facepalm}
   | 
  | 11 | 
  
    
   | 
  | 12 | 
  
    echo "farmer len =" $[len(farmer)]
   | 
  | 13 | 
  
    
   | 
  | 14 | 
  
    echo "facepalm len =" $[len(facepalm)]
   | 
  | 15 | 
  
    
   | 
  | 16 | 
  
    ## STDOUT:
   | 
  | 17 | 
  
    farmer scalars = 4
   | 
  | 18 | 
  
    facepalm scalars = 5
   | 
  | 19 | 
  
    farmer len = 15
   | 
  | 20 | 
  
    facepalm len = 17
   | 
  | 21 | 
  
    ## END
   | 
  | 22 | 
  
    
   | 
  | 23 | 
  
    
   | 
  | 24 | 
  
    
   | 
  | 25 | 
  
    
   | 
  | 26 | 
  
    py-decode() {
   | 
  | 27 | 
  
      python2 -c 'import json, sys; print json.load(sys.stdin).encode("utf-8")'
   | 
  | 28 | 
  
    }
   | 
  | 29 | 
  
    
   | 
  | 30 | 
  
    to-hex() {
   | 
  | 31 | 
  
      od -A n -t x1
   | 
  | 32 | 
  
    }
   | 
  | 33 | 
  
    
   | 
  | 34 | 
  
    max='"\udbff\udfff"'
   | 
  | 35 | 
  
    
   | 
  | 36 | 
  
    # incrementing by one gives invalid surrogates
   | 
  | 37 | 
  
    # the encoding is "tight"
   | 
  | 38 | 
  
    # too_big='"\udc00\udfff"'
   | 
  | 39 | 
  
    
   | 
  | 40 | 
  
    echo "$max" | py-decode | to-hex
   | 
  | 41 | 
  
    
   | 
  | 42 | 
  
    echo "$max" | json read
   | 
  | 43 | 
  
    echo "$_reply" | to-hex
   | 
  | 44 | 
  
    
   | 
  | 45 | 
  
    ## STDOUT:
   | 
  | 46 | 
  
     f4 8f bf bf 0a
   | 
  | 47 | 
  
     f4 8f bf bf 0a
   | 
  | 48 | 
  
    ## END
   | 
  | 49 | 
  
    
   | 
  | 50 | 
  
    
   | 
  | 51 | 
  
    
   | 
  | 52 | 
  
    
   | 
  | 53 | 
  
    
   | 
  | 54 | 
  
    json8 read <<EOF
   | 
  | 55 | 
  
    u'\u{110000}'
   | 
  | 56 | 
  
    EOF
   | 
  | 57 | 
  
    echo status=$?
   | 
  | 58 | 
  
    
   | 
  | 59 | 
  
    ## STDOUT:
   | 
  | 60 | 
  
    status=1
   | 
  | 61 | 
  
    ## END
   | 
  | 62 | 
  
    
   | 
  | 63 | 
  
    
   | 
  | 64 | 
  
    
   | 
  | 65 | 
  
    
   | 
  | 66 | 
  
    # Sanity check first: Python interpreter DOES check big code points,
   | 
  | 67 | 
  
    # whereas shells don't
   | 
  | 68 | 
  
    
   | 
  | 69 | 
  
    max=$(python2 -c 'print u"\U0010ffff".encode("utf-8")')
   | 
  | 70 | 
  
    echo status max=$?
   | 
  | 71 | 
  
    
   | 
  | 72 | 
  
    too_big=$(python2 -c 'print u"\U00110000".encode("utf-8")')
   | 
  | 73 | 
  
    echo status too_big=$?
   | 
  | 74 | 
  
    
   | 
  | 75 | 
  
    #echo py max=$max
   | 
  | 76 | 
  
    #echo py too_big=$too_big
   | 
  | 77 | 
  
    
   | 
  | 78 | 
  
    # python2 -c 'import sys; c = sys.argv[1].decode("utf-8"); print len(c)' "$ok"
   | 
  | 79 | 
  
    # python2 -c 'import sys; c = sys.argv[1].decode("utf-8"); print len(c)' "$too_big"
   | 
  | 80 | 
  
    
   | 
  | 81 | 
  
    var max = u'\u{10ffff}'
   | 
  | 82 | 
  
    pp line (max)
   | 
  | 83 | 
  
    
   | 
  | 84 | 
  
    var too_big = u'\u{110000}'
   | 
  | 85 | 
  
    pp line (too_big)  # should not get here
   | 
  | 86 | 
  
    
   | 
  | 87 | 
  
    # These are errors too
   | 
  | 88 | 
  
    var max = b'\u{10ffff}'
   | 
  | 89 | 
  
    var too_big = b'\u{110000}'
   | 
  | 90 | 
  
    
   | 
  | 91 | 
  
    ## status: 2
   | 
  | 92 | 
  
    ## STDOUT:
   | 
  | 93 | 
  
    status max=0
   | 
  | 94 | 
  
    status too_big=1
   | 
  | 95 | 
  
    (Str)   ""
   | 
  | 96 | 
  
    ## END
   | 
  | 97 | 
  
    
   | 
  | 98 | 
  
    
   | 
  | 99 | 
  
    
   | 
  | 100 | 
  
    
   | 
  | 101 | 
  
    max=$(bash <<'EOF'
   | 
  | 102 | 
  
    echo $'\U0010ffff'
   | 
  | 103 | 
  
    EOF
   | 
  | 104 | 
  
    )
   | 
  | 105 | 
  
    
   | 
  | 106 | 
  
    # bash allows the bad one
   | 
  | 107 | 
  
    too_big=$(bash <<'EOF'
   | 
  | 108 | 
  
    echo $'\U00110000'
   | 
  | 109 | 
  
    EOF
   | 
  | 110 | 
  
    )
   | 
  | 111 | 
  
    
   | 
  | 112 | 
  
    echo "var x = u'"$max"'; = x" | $SH
   | 
  | 113 | 
  
    echo status=$?
   | 
  | 114 | 
  
    #pp line (_reply)
   | 
  | 115 | 
  
    
   | 
  | 116 | 
  
    echo "var x = u'"$too_big"'; = x" | $SH
   | 
  | 117 | 
  
    echo status=$?
   | 
  | 118 | 
  
    #pp line (_reply)
   | 
  | 119 | 
  
    
   | 
  | 120 | 
  
    ## STDOUT:
   | 
  | 121 | 
  
    ## END
   | 
  | 122 | 
  
    
   | 
  | 123 | 
  
    
   | 
  | 124 | 
  
    
   | 
  | 125 | 
  
    
   | 
  | 126 | 
  
    max=$(bash <<'EOF'
   | 
  | 127 | 
  
    echo $'\U0010ffff'
   | 
  | 128 | 
  
    EOF
   | 
  | 129 | 
  
    )
   | 
  | 130 | 
  
    
   | 
  | 131 | 
  
    # bash allows the bad one
   | 
  | 132 | 
  
    too_big=$(bash <<'EOF'
   | 
  | 133 | 
  
    echo $'\U00110000'
   | 
  | 134 | 
  
    EOF
   | 
  | 135 | 
  
    )
   | 
  | 136 | 
  
    
   | 
  | 137 | 
  
    # JSON string
   | 
  | 138 | 
  
    
   | 
  | 139 | 
  
    echo '"'$max'"' | json read
   | 
  | 140 | 
  
    echo status=$?
   | 
  | 141 | 
  
    #pp line (_reply)
   | 
  | 142 | 
  
    
   | 
  | 143 | 
  
    # Need to propagate the reason here
   | 
  | 144 | 
  
    
   | 
  | 145 | 
  
    echo '"'$too_big'"' | json read
   | 
  | 146 | 
  
    echo status=$?
   | 
  | 147 | 
  
    #pp line (_reply)
   | 
  | 148 | 
  
    
   | 
  | 149 | 
  
    
   | 
  | 150 | 
  
    # J8 string
   | 
  | 151 | 
  
    
   | 
  | 152 | 
  
    echo "u'"$max"'" | json8 read
   | 
  | 153 | 
  
    echo status=$?
   | 
  | 154 | 
  
    #pp line (_reply)
   | 
  | 155 | 
  
    
   | 
  | 156 | 
  
    echo "u'"$too_big"'" | json8 read
   | 
  | 157 | 
  
    echo status=$?
   | 
  | 158 | 
  
    #pp line (_reply)
   | 
  | 159 | 
  
    
   | 
  | 160 | 
  
    ## STDOUT:
   | 
  | 161 | 
  
    status=0
   | 
  | 162 | 
  
    status=1
   | 
  | 163 | 
  
    status=0
   | 
  | 164 | 
  
    status=1
   | 
  | 165 | 
  
    ## END
   | 
  | 166 | 
  
    
   | 
  | 167 | 
  
    
   | 
  | 168 | 
  
    
   | 
  | 169 | 
  
    var max = u'\u{10ffff}'
   | 
  | 170 | 
  
    
   | 
  | 171 | 
  
    json write (max)
   | 
  | 172 | 
  
    json8 write (max)
   | 
  | 173 | 
  
    
   | 
  | 174 | 
  
    = max
   | 
  | 175 | 
  
    pp line (max)
   | 
  | 176 | 
  
    
   | 
  | 177 | 
  
    #echo "var x = u'"$max"'; = x" | $SH
   | 
  | 178 | 
  
    
   | 
  | 179 | 
  
    ## STDOUT:
   | 
  | 180 | 
  
    ""
   | 
  | 181 | 
  
    ""
   | 
  | 182 | 
  
    (Str)   ''
   | 
  | 183 | 
  
    (Str)   ""
   | 
  | 184 | 
  
    ## END
   |