<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head>
<!-- Generated by HsColour, http://www.cs.york.ac.uk/fp/darcs/hscolour/ -->
<meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
<title>Data/Text/UnsafeChar.hs</title>
<link type="text/css" rel="stylesheet" href="hscolour.css" />
</head>
<body>
<!--
  Syntax-highlighted listing of the Haskell module Data.Text.UnsafeChar.

  Structure of the listing below:
  * Everything lives in a single pre element, so whitespace and line
    breaks are significant: one physical line per Haskell source line.
  * Each source line starts with an empty anchor named "line-N", which
    allows deep links to a given line number.
  * Top-level definitions carry an additional anchor named after the
    definition (ord, unsafeChr, unsafeChr8, unsafeChr32, unsafeWrite).
  * Tokens are wrapped in spans whose hs-* class is styled by hscolour.css.
  * The characters "<", ">" and "&" coming from the Haskell source are
    written as entities so that the page stays well-formed XML.
-->
<pre><a name="line-1"></a><span class="hs-comment">{-# LANGUAGE CPP, MagicHash #-}</span>
<a name="line-2"></a>
<a name="line-3"></a><span class="hs-comment">-- |</span>
<a name="line-4"></a><span class="hs-comment">-- Module : Data.Text.UnsafeChar</span>
<a name="line-5"></a><span class="hs-comment">-- Copyright : (c) 2008, 2009 Tom Harper,</span>
<a name="line-6"></a><span class="hs-comment">-- (c) 2009, 2010 Bryan O'Sullivan,</span>
<a name="line-7"></a><span class="hs-comment">-- (c) 2009 Duncan Coutts</span>
<a name="line-8"></a><span class="hs-comment">--</span>
<a name="line-9"></a><span class="hs-comment">-- License : BSD-style</span>
<a name="line-10"></a><span class="hs-comment">-- Maintainer : bos@serpentine.com, rtomharper@googlemail.com,</span>
<a name="line-11"></a><span class="hs-comment">-- duncan@haskell.org</span>
<a name="line-12"></a><span class="hs-comment">-- Stability : experimental</span>
<a name="line-13"></a><span class="hs-comment">-- Portability : GHC</span>
<a name="line-14"></a><span class="hs-comment">--</span>
<a name="line-15"></a><span class="hs-comment">-- Fast character manipulation functions.</span>
<a name="line-16"></a><span class="hs-keyword">module</span> <span class="hs-conid">Data</span><span class="hs-varop">.</span><span class="hs-conid">Text</span><span class="hs-varop">.</span><span class="hs-conid">UnsafeChar</span>
<a name="line-17"></a>    <span class="hs-layout">(</span>
<a name="line-18"></a>      <span class="hs-varid">ord</span>
<a name="line-19"></a>    <span class="hs-layout">,</span> <span class="hs-varid">unsafeChr</span>
<a name="line-20"></a>    <span class="hs-layout">,</span> <span class="hs-varid">unsafeChr8</span>
<a name="line-21"></a>    <span class="hs-layout">,</span> <span class="hs-varid">unsafeChr32</span>
<a name="line-22"></a>    <span class="hs-layout">,</span> <span class="hs-varid">unsafeWrite</span>
<a name="line-23"></a>    <span class="hs-comment">-- , unsafeWriteRev</span>
<a name="line-24"></a>    <span class="hs-layout">)</span> <span class="hs-keyword">where</span>
<a name="line-25"></a>
<a name="line-26"></a><span class="hs-cpp">#ifdef ASSERTS</span>
<a name="line-27"></a><span class="hs-keyword">import</span> <span class="hs-conid">Control</span><span class="hs-varop">.</span><span class="hs-conid">Exception</span> <span class="hs-layout">(</span><span class="hs-varid">assert</span><span class="hs-layout">)</span>
<a name="line-28"></a><span class="hs-cpp">#endif</span>
<a name="line-29"></a><span class="hs-keyword">import</span> <span class="hs-conid">Control</span><span class="hs-varop">.</span><span class="hs-conid">Monad</span><span class="hs-varop">.</span><span class="hs-conid">ST</span> <span class="hs-layout">(</span><span class="hs-conid">ST</span><span class="hs-layout">)</span>
<a name="line-30"></a><span class="hs-keyword">import</span> <span class="hs-conid">Data</span><span class="hs-varop">.</span><span class="hs-conid">Bits</span> <span class="hs-layout">(</span><span class="hs-layout">(</span><span class="hs-varop">.&amp;.</span><span class="hs-layout">)</span><span class="hs-layout">)</span>
<a name="line-31"></a><span class="hs-keyword">import</span> <span class="hs-conid">Data</span><span class="hs-varop">.</span><span class="hs-conid">Text</span><span class="hs-varop">.</span><span class="hs-conid">UnsafeShift</span> <span class="hs-layout">(</span><span class="hs-varid">shiftR</span><span class="hs-layout">)</span>
<a name="line-32"></a><span class="hs-keyword">import</span> <span class="hs-conid">GHC</span><span class="hs-varop">.</span><span class="hs-conid">Exts</span> <span class="hs-layout">(</span><span class="hs-conid">Char</span><span class="hs-layout">(</span><span class="hs-keyglyph">..</span><span class="hs-layout">)</span><span class="hs-layout">,</span> <span class="hs-conid">Int</span><span class="hs-layout">(</span><span class="hs-keyglyph">..</span><span class="hs-layout">)</span><span class="hs-layout">,</span> <span class="hs-varid">chr</span><span class="hs-cpp">#</span><span class="hs-layout">,</span> <span class="hs-varid">ord</span><span class="hs-cpp">#</span><span class="hs-layout">,</span> <span class="hs-varid">word2Int</span><span class="hs-cpp">#</span><span class="hs-layout">)</span>
<a name="line-33"></a><span class="hs-keyword">import</span> <span class="hs-conid">GHC</span><span class="hs-varop">.</span><span class="hs-conid">Word</span> <span class="hs-layout">(</span><span class="hs-conid">Word8</span><span class="hs-layout">(</span><span class="hs-keyglyph">..</span><span class="hs-layout">)</span><span class="hs-layout">,</span> <span class="hs-conid">Word16</span><span class="hs-layout">(</span><span class="hs-keyglyph">..</span><span class="hs-layout">)</span><span class="hs-layout">,</span> <span class="hs-conid">Word32</span><span class="hs-layout">(</span><span class="hs-keyglyph">..</span><span class="hs-layout">)</span><span class="hs-layout">)</span>
<a name="line-34"></a><span class="hs-keyword">import</span> <span class="hs-keyword">qualified</span> <span class="hs-conid">Data</span><span class="hs-varop">.</span><span class="hs-conid">Text</span><span class="hs-varop">.</span><span class="hs-conid">Array</span> <span class="hs-keyword">as</span> <span class="hs-conid">A</span>
<a name="line-35"></a>
<a name="line-36"></a><a name="ord"></a><span class="hs-definition">ord</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">Char</span> <span class="hs-keyglyph">-&gt;</span> <span class="hs-conid">Int</span>
<a name="line-37"></a><span class="hs-definition">ord</span> <span class="hs-layout">(</span><span class="hs-conid">C</span><span class="hs-cpp">#</span> <span class="hs-varid">c</span><span class="hs-cpp">#</span><span class="hs-layout">)</span> <span class="hs-keyglyph">=</span> <span class="hs-conid">I</span><span class="hs-cpp">#</span> <span class="hs-layout">(</span><span class="hs-varid">ord</span><span class="hs-cpp">#</span> <span class="hs-varid">c</span><span class="hs-cpp">#</span><span class="hs-layout">)</span>
<a name="line-38"></a><span class="hs-comment">{-# INLINE ord #-}</span>
<a name="line-39"></a>
<a name="line-40"></a><a name="unsafeChr"></a><span class="hs-definition">unsafeChr</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">Word16</span> <span class="hs-keyglyph">-&gt;</span> <span class="hs-conid">Char</span>
<a name="line-41"></a><span class="hs-definition">unsafeChr</span> <span class="hs-layout">(</span><span class="hs-conid">W16</span><span class="hs-cpp">#</span> <span class="hs-varid">w</span><span class="hs-cpp">#</span><span class="hs-layout">)</span> <span class="hs-keyglyph">=</span> <span class="hs-conid">C</span><span class="hs-cpp">#</span> <span class="hs-layout">(</span><span class="hs-varid">chr</span><span class="hs-cpp">#</span> <span class="hs-layout">(</span><span class="hs-varid">word2Int</span><span class="hs-cpp">#</span> <span class="hs-varid">w</span><span class="hs-cpp">#</span><span class="hs-layout">)</span><span class="hs-layout">)</span>
<a name="line-42"></a><span class="hs-comment">{-# INLINE unsafeChr #-}</span>
<a name="line-43"></a>
<a name="line-44"></a><a name="unsafeChr8"></a><span class="hs-definition">unsafeChr8</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">Word8</span> <span class="hs-keyglyph">-&gt;</span> <span class="hs-conid">Char</span>
<a name="line-45"></a><span class="hs-definition">unsafeChr8</span> <span class="hs-layout">(</span><span class="hs-conid">W8</span><span class="hs-cpp">#</span> <span class="hs-varid">w</span><span class="hs-cpp">#</span><span class="hs-layout">)</span> <span class="hs-keyglyph">=</span> <span class="hs-conid">C</span><span class="hs-cpp">#</span> <span class="hs-layout">(</span><span class="hs-varid">chr</span><span class="hs-cpp">#</span> <span class="hs-layout">(</span><span class="hs-varid">word2Int</span><span class="hs-cpp">#</span> <span class="hs-varid">w</span><span class="hs-cpp">#</span><span class="hs-layout">)</span><span class="hs-layout">)</span>
<a name="line-46"></a><span class="hs-comment">{-# INLINE unsafeChr8 #-}</span>
<a name="line-47"></a>
<a name="line-48"></a><a name="unsafeChr32"></a><span class="hs-definition">unsafeChr32</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">Word32</span> <span class="hs-keyglyph">-&gt;</span> <span class="hs-conid">Char</span>
<a name="line-49"></a><span class="hs-definition">unsafeChr32</span> <span class="hs-layout">(</span><span class="hs-conid">W32</span><span class="hs-cpp">#</span> <span class="hs-varid">w</span><span class="hs-cpp">#</span><span class="hs-layout">)</span> <span class="hs-keyglyph">=</span> <span class="hs-conid">C</span><span class="hs-cpp">#</span> <span class="hs-layout">(</span><span class="hs-varid">chr</span><span class="hs-cpp">#</span> <span class="hs-layout">(</span><span class="hs-varid">word2Int</span><span class="hs-cpp">#</span> <span class="hs-varid">w</span><span class="hs-cpp">#</span><span class="hs-layout">)</span><span class="hs-layout">)</span>
<a name="line-50"></a><span class="hs-comment">{-# INLINE unsafeChr32 #-}</span>
<a name="line-51"></a>
<a name="line-52"></a><a name="unsafeWrite"></a><span class="hs-comment">-- | Write a character into the array at the given offset. Returns</span>
<a name="line-53"></a><span class="hs-comment">-- the number of 'Word16's written.</span>
<a name="line-54"></a><span class="hs-definition">unsafeWrite</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">A</span><span class="hs-varop">.</span><span class="hs-conid">MArray</span> <span class="hs-varid">s</span> <span class="hs-keyglyph">-&gt;</span> <span class="hs-conid">Int</span> <span class="hs-keyglyph">-&gt;</span> <span class="hs-conid">Char</span> <span class="hs-keyglyph">-&gt;</span> <span class="hs-conid">ST</span> <span class="hs-varid">s</span> <span class="hs-conid">Int</span>
<a name="line-55"></a><span class="hs-definition">unsafeWrite</span> <span class="hs-varid">marr</span> <span class="hs-varid">i</span> <span class="hs-varid">c</span>
<a name="line-56"></a>    <span class="hs-keyglyph">|</span> <span class="hs-varid">n</span> <span class="hs-varop">&lt;</span> <span class="hs-num">0x10000</span> <span class="hs-keyglyph">=</span> <span class="hs-keyword">do</span>
<a name="line-57"></a><span class="hs-cpp">#if defined(ASSERTS)</span>
<a name="line-58"></a>        <span class="hs-varid">assert</span> <span class="hs-layout">(</span><span class="hs-varid">i</span> <span class="hs-varop">&gt;=</span> <span class="hs-num">0</span><span class="hs-layout">)</span> <span class="hs-varop">.</span> <span class="hs-varid">assert</span> <span class="hs-layout">(</span><span class="hs-varid">i</span> <span class="hs-varop">&lt;</span> <span class="hs-conid">A</span><span class="hs-varop">.</span><span class="hs-varid">length</span> <span class="hs-varid">marr</span><span class="hs-layout">)</span> <span class="hs-varop">$</span> <span class="hs-varid">return</span> <span class="hs-conid">()</span>
<a name="line-59"></a><span class="hs-cpp">#endif</span>
<a name="line-60"></a>        <span class="hs-conid">A</span><span class="hs-varop">.</span><span class="hs-varid">unsafeWrite</span> <span class="hs-varid">marr</span> <span class="hs-varid">i</span> <span class="hs-layout">(</span><span class="hs-varid">fromIntegral</span> <span class="hs-varid">n</span><span class="hs-layout">)</span>
<a name="line-61"></a>        <span class="hs-varid">return</span> <span class="hs-num">1</span>
<a name="line-62"></a>    <span class="hs-keyglyph">|</span> <span class="hs-varid">otherwise</span> <span class="hs-keyglyph">=</span> <span class="hs-keyword">do</span>
<a name="line-63"></a><span class="hs-cpp">#if defined(ASSERTS)</span>
<a name="line-64"></a>        <span class="hs-varid">assert</span> <span class="hs-layout">(</span><span class="hs-varid">i</span> <span class="hs-varop">&gt;=</span> <span class="hs-num">0</span><span class="hs-layout">)</span> <span class="hs-varop">.</span> <span class="hs-varid">assert</span> <span class="hs-layout">(</span><span class="hs-varid">i</span> <span class="hs-varop">&lt;</span> <span class="hs-conid">A</span><span class="hs-varop">.</span><span class="hs-varid">length</span> <span class="hs-varid">marr</span> <span class="hs-comment">-</span> <span class="hs-num">1</span><span class="hs-layout">)</span> <span class="hs-varop">$</span> <span class="hs-varid">return</span> <span class="hs-conid">()</span>
<a name="line-65"></a><span class="hs-cpp">#endif</span>
<a name="line-66"></a>        <span class="hs-conid">A</span><span class="hs-varop">.</span><span class="hs-varid">unsafeWrite</span> <span class="hs-varid">marr</span> <span class="hs-varid">i</span> <span class="hs-varid">lo</span>
<a name="line-67"></a>        <span class="hs-conid">A</span><span class="hs-varop">.</span><span class="hs-varid">unsafeWrite</span> <span class="hs-varid">marr</span> <span class="hs-layout">(</span><span class="hs-varid">i</span><span class="hs-varop">+</span><span class="hs-num">1</span><span class="hs-layout">)</span> <span class="hs-varid">hi</span>
<a name="line-68"></a>        <span class="hs-varid">return</span> <span class="hs-num">2</span>
<a name="line-69"></a>    <span class="hs-keyword">where</span> <span class="hs-varid">n</span> <span class="hs-keyglyph">=</span> <span class="hs-varid">ord</span> <span class="hs-varid">c</span>
<a name="line-70"></a>          <span class="hs-varid">m</span> <span class="hs-keyglyph">=</span> <span class="hs-varid">n</span> <span class="hs-comment">-</span> <span class="hs-num">0x10000</span>
<a name="line-71"></a>          <span class="hs-varid">lo</span> <span class="hs-keyglyph">=</span> <span class="hs-varid">fromIntegral</span> <span class="hs-varop">$</span> <span class="hs-layout">(</span><span class="hs-varid">m</span> <span class="hs-varop">`shiftR`</span> <span class="hs-num">10</span><span class="hs-layout">)</span> <span class="hs-varop">+</span> <span class="hs-num">0xD800</span>
<a name="line-72"></a>          <span class="hs-varid">hi</span> <span class="hs-keyglyph">=</span> <span class="hs-varid">fromIntegral</span> <span class="hs-varop">$</span> <span class="hs-layout">(</span><span class="hs-varid">m</span> <span class="hs-varop">.&amp;.</span> <span class="hs-num">0x3FF</span><span class="hs-layout">)</span> <span class="hs-varop">+</span> <span class="hs-num">0xDC00</span>
<a name="line-73"></a><span class="hs-comment">{-# INLINE unsafeWrite #-}</span>
<a name="line-74"></a>
<a name="line-75"></a><span class="hs-comment">{-
<a name="line-76"></a>unsafeWriteRev :: A.MArray s Word16 -&gt; Int -&gt; Char -&gt; ST s Int
<a name="line-77"></a>unsafeWriteRev marr i c
<a name="line-78"></a>    | n &lt; 0x10000 = do
<a name="line-79"></a>        assert (i &gt;= 0) . assert (i &lt; A.length marr) $
<a name="line-80"></a>          A.unsafeWrite marr i (fromIntegral n)
<a name="line-81"></a>        return (i-1)
<a name="line-82"></a>    | otherwise = do
<a name="line-83"></a>        assert (i &gt;= 1) . assert (i &lt; A.length marr) $
<a name="line-84"></a>          A.unsafeWrite marr (i-1) lo
<a name="line-85"></a>        A.unsafeWrite marr i hi
<a name="line-86"></a>        return (i-2)
<a name="line-87"></a>    where n = ord c
<a name="line-88"></a>          m = n - 0x10000
<a name="line-89"></a>          lo = fromIntegral $ (m `shiftR` 10) + 0xD800
<a name="line-90"></a>          hi = fromIntegral $ (m .&amp;. 0x3FF) + 0xDC00
<a name="line-91"></a>{-# INLINE unsafeWriteRev #-}
<a name="line-92"></a>-}</span>
</pre>
</body>
</html>