43 lines
1.3 KiB
Text
43 lines
1.3 KiB
Text
/-
|
|
Copyright (c) 2016 Microsoft Corporation. All rights reserved.
|
|
Released under Apache 2.0 license as described in the file LICENSE.
|
|
Author: Leonardo de Moura
|
|
-/
|
|
prelude
|
|
import init.char init.list
|
|
attribute [reducible]
|
|
definition string := list char
|
|
|
|
namespace string
|
|
|
|
attribute [pattern]
|
|
definition empty : string := list.nil
|
|
|
|
attribute [pattern]
|
|
definition str : char → string → string := list.cons
|
|
|
|
definition concat (a b : string) : string :=
|
|
list.append b a
|
|
end string
|
|
|
|
attribute [instance]
|
|
definition string.has_append : has_append string :=
|
|
⟨string.concat⟩
|
|
|
|
open list
|
|
|
|
private definition utf8_length_aux : nat → nat → string → nat
|
|
| 0 r (c::s) :=
|
|
let n := char.to_nat c in
|
|
if n < 0x80 then utf8_length_aux 0 (r+1) s
|
|
else if 0xC0 ≤ n ∧ n < 0xE0 then utf8_length_aux 1 (r+1) s
|
|
else if 0xE0 ≤ n ∧ n < 0xF0 then utf8_length_aux 2 (r+1) s
|
|
else if 0xF0 ≤ n ∧ n < 0xF8 then utf8_length_aux 3 (r+1) s
|
|
else if 0xF8 ≤ n ∧ n < 0xFC then utf8_length_aux 4 (r+1) s
|
|
else if 0xFC ≤ n ∧ n < 0xFE then utf8_length_aux 5 (r+1) s
|
|
else utf8_length_aux 0 (r+1) s
|
|
| (n+1) r (c::s) := utf8_length_aux n r s
|
|
| n r [] := r
|
|
|
|
definition utf8_length : string → nat
|
|
| s := utf8_length_aux 0 0 (reverse s)
|