blob: 64062dd3c7d837017aa8becfdb12d4fb63944412 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
|
Various Unicode-related utilities.
\begin{code}
module UnicodeUtil(
stringToUtf8
) where
#include "HsVersions.h"
import Panic ( panic )
import Char ( chr )
\end{code}
\begin{code}
-- | Encode a list of integer code points as a UTF-8-style byte string,
-- producing one 'Char' per output byte.
--
-- Values in 1..0x7F are emitted as a single byte.  Larger values, up to
-- 0x7FFFFFFF, use between two and six bytes: a lead byte carrying a length
-- tag plus the topmost bits, followed by continuation bytes of the form
-- @0x80 + six bits@.  Note that 0 is excluded from the one-byte case and
-- therefore takes the two-byte branch (bytes 0xC0, 0x80).
--
-- Panics on a negative value or on a value above 0x7FFFFFFF.
stringToUtf8 :: [Int] -> String
stringToUtf8 = foldr encode ""
  where
    -- Prepend the bytes for one code point to the already-encoded tail.
    encode cp rest
      | cp >= 1 && cp <= 0x7F = chr cp : rest
      | cp < 0                = panic ("charToUtf8 ("++show cp++")")
      | cp <= 0x7FF           = multiByte 0xC0 0x40       [1]
      | cp <= 0xFFFF          = multiByte 0xE0 0x1000     [0x40, 1]
      | cp <= 0x1FFFFF        = multiByte 0xF0 0x40000    [0x1000, 0x40, 1]
      | cp <= 0x3FFFFFF       = multiByte 0xF8 0x1000000  [0x40000, 0x1000, 0x40, 1]
      | cp <= 0x7FFFFFFF      = multiByte 0xFC 0x40000000
                                  [0x1000000, 0x40000, 0x1000, 0x40, 1]
      | otherwise             = panic ("charToUtf8 "++show cp)
      where
        -- Lead byte: length tag plus the bits above 'leadDiv'; then one
        -- continuation byte per divisor, most significant group first.
        multiByte tag leadDiv contDivs =
          chr (tag + cp `div` leadDiv) : (map continuation contDivs ++ rest)

        -- Continuation byte holding the six-bit group selected by divisor
        -- 'd' (a divisor of 1 selects the lowest six bits).
        continuation d = chr (0x80 + cp `div` d `mod` 0x40)
\end{code}
|