~ubuntu-branches/ubuntu/precise/ghc/precise

| otherwise = extractAnswer $ foldl' (restrictedDamerauLevenshteinDistanceWorker (matchVectors str1) top_bit_mask vector_mask) (0, 0, m_ones, 0, m) str2

714

where m_ones@vector_mask = (2 ^ m) - 1

715

top_bit_mask = (1 `shiftL` (m - 1)) `asTypeOf` _bv_dummy

716

extractAnswer (_, _, _, _, distance) = distance

717

718

-- | One fold step of the bit-vector edit-distance computation: consumes one
-- character of the second string and produces the next state.
--
-- The state tuple is @(pm, d0, vp, vn, distance)@.  The match vector for
-- @char2@ is looked up in @str1_mvs@ (defaulting to 0 when the character
-- does not occur), the new bit vectors are derived from it, and @distance@
-- is incremented when the top bit of @hp'@ is set and decremented when the
-- top bit of @hn'@ is set.
--
-- NOTE(review): the names suggest the usual horizontal/vertical
-- positive/negative delta vectors of a bit-parallel edit-distance
-- algorithm -- confirm against the caller's documentation.
--
-- The 'Num' constraint is spelled out because the body uses numeric
-- literals and @(+)@; newer versions of base no longer make 'Num' a
-- superclass of 'Bits'.
restrictedDamerauLevenshteinDistanceWorker
    :: (Num bv, Bits bv)
    => IM.IntMap bv -> bv -> bv -> (bv, bv, bv, bv, Int) -> Char -> (bv, bv, bv, bv, Int)
restrictedDamerauLevenshteinDistanceWorker str1_mvs top_bit_mask vector_mask (pm, d0, vp, vn, distance) char2
  -- Force every component so the fold does not accumulate thunks.
  = seq str1_mvs $ seq top_bit_mask $ seq vector_mask $ seq pm' $ seq d0' $ seq vp' $ seq vn' $ seq distance'' $ seq char2 $ (pm', d0', vp', vn', distance'')
  where
    -- Match vector of the current character (0 if it never occurs).
    pm' = IM.findWithDefault 0 (ord char2) str1_mvs

    d0' = ((((sizedComplement vector_mask d0) .&. pm') `shiftL` 1) .&. pm) -- No need to mask the shiftL because of the restricted range of pm
      .|. ((((pm' .&. vp) + vp) .&. vector_mask) `xor` vp) .|. pm' .|. vn
    hp' = vn .|. sizedComplement vector_mask (d0' .|. vp)
    hn' = d0' .&. vp

    -- Shifted copies are masked back to the vector width.
    hp'_shift = ((hp' `shiftL` 1) .|. 1) .&. vector_mask
    hn'_shift = (hn' `shiftL` 1) .&. vector_mask
    vp' = hn'_shift .|. sizedComplement vector_mask (d0' .|. hp'_shift)
    vn' = d0' .&. hp'_shift

    -- The top bit of hp' / hn' decides whether the distance goes up or down.
    distance'  = if hp' .&. top_bit_mask /= 0 then distance  + 1 else distance
    distance'' = if hn' .&. top_bit_mask /= 0 then distance' - 1 else distance'

736

737

-- | Complement of @vect@ restricted to the bits set in @vector_mask@,
-- computed as the exclusive-or of the two.
sizedComplement :: Bits bv => bv -> bv -> bv
sizedComplement vector_mask vect = xor vector_mask vect

739

740

-- | Build the per-character match vectors of a string: the result maps the
-- code point of each character to a bit vector in which bit @i@ is set
-- whenever the character occurs at (zero-based) position @i@.
--
-- The 'Num' constraint is spelled out because the body uses @2 ^ ix@;
-- newer versions of base no longer make 'Num' a superclass of 'Bits'.
matchVectors :: (Num bv, Bits bv) => String -> IM.IntMap bv
matchVectors = snd . foldl' go (0 :: Int, IM.empty)
  where
    -- Both the running index and the map are forced at every step so that
    -- the fold does not build up thunks.
    go (ix, im) char = let ix' = ix + 1
                           im' = IM.insertWith (.|.) (ord char) (2 ^ ix) im
                       in seq ix' $ seq im' $ (ix', im')

746

747

#ifdef __GLASGOW_HASKELL__

748

{-# SPECIALIZE INLINE restrictedDamerauLevenshteinDistance' :: Word32 -> Int -> Int -> String -> String -> Int #-}

749

{-# SPECIALIZE INLINE restrictedDamerauLevenshteinDistance' :: Integer -> Int -> Int -> String -> String -> Int #-}

750

751

{-# SPECIALIZE restrictedDamerauLevenshteinDistanceWorker :: IM.IntMap Word32 -> Word32 -> Word32 -> (Word32, Word32, Word32, Word32, Int) -> Char -> (Word32, Word32, Word32, Word32, Int) #-}

752

{-# SPECIALIZE restrictedDamerauLevenshteinDistanceWorker :: IM.IntMap Integer -> Integer -> Integer -> (Integer, Integer, Integer, Integer, Int) -> Char -> (Integer, Integer, Integer, Integer, Int) #-}

753

754

{-# SPECIALIZE INLINE sizedComplement :: Word32 -> Word32 -> Word32 #-}

755

{-# SPECIALIZE INLINE sizedComplement :: Integer -> Integer -> Integer #-}

756

757

{-# SPECIALIZE matchVectors :: String -> IM.IntMap Word32 #-}

758

{-# SPECIALIZE matchVectors :: String -> IM.IntMap Integer #-}

759

#endif

760

761

-- | Search the given candidates for likely matches to the user's input,
-- returning at most 'mAX_RESULTS' of them, closest first.
fuzzyMatch :: String -> [String] -> [String]
fuzzyMatch user_entered candidates = map fst (take mAX_RESULTS ranked)
  where
    -- Candidates that are close enough, ordered by increasing distance.
    ranked = sortBy (comparing snd) (filter closeEnough scored)

    scored = [ (candidate, restrictedDamerauLevenshteinDistance candidate user_entered)
             | candidate <- candidates ]

    closeEnough (_, distance) = distance <= fuzzy_threshold

    -- Work out an appropriate match threshold: about a quarter of the
    -- number of characters the user entered, but never less than 1.
    fuzzy_threshold = max (round (fromInteger (genericLength user_entered) / (4 :: Rational))) 1

    mAX_RESULTS = 3

770

\end{code}

771

772

%************************************************************************

773

%* *

774

\subsection[Utils-pairs]{Pairs}

775

%* *

776

%************************************************************************

777

778

\begin{code}

779

-- | Apply a two-argument function to each pair of a list.
unzipWith :: (a -> b -> c) -> [(a, b)] -> [c]
unzipWith f pairs = map onPair pairs
  where
    onPair (a, b) = f a b

781

\end{code}

782

783

\begin{code}

784

-- | Evaluate every element of the list to weak head normal form, from left
-- to right, before returning the second argument.
seqList :: [a] -> b -> b
seqList xs b = foldr seq b xs

787

\end{code}

788

789

Global variables:

790

791

\begin{code}

792

-- | Allocate an 'IORef' holding the given initial value, outside of 'IO',
-- by way of 'unsafePerformIO'.
--
-- NOTE(review): presumably each use is a top-level binding marked
-- NOINLINE so that the reference is created only once -- confirm at the
-- call sites.
global :: a -> IORef a
global a = unsafePerformIO $ newIORef a

794

\end{code}

795

796

\begin{code}

797

-- | Atomically prepend an element to the list stored in an 'IORef'.
consIORef :: IORef [a] -> a -> IO ()
consIORef var x = atomicModifyIORef var prepend
  where
    prepend xs = (x : xs, ())

800

\end{code}

801

802

\begin{code}

803

-- | Allocate an 'MVar' holding the given initial value, outside of 'IO',
-- by way of 'unsafePerformIO'.
--
-- NOTE(review): presumably each use is a top-level binding marked
-- NOINLINE so that the variable is created only once -- confirm at the
-- call sites.
globalMVar :: a -> MVar a
globalMVar a = unsafePerformIO $ newMVar a

805

806

-- | An initially empty 'MVar' allocated outside of 'IO' by way of
-- 'unsafePerformIO'.
--
-- NOTE(review): presumably each use is a top-level binding marked
-- NOINLINE so that the variable is created only once -- confirm at the
-- call sites.
globalEmptyMVar :: MVar a
globalEmptyMVar = unsafePerformIO (newEmptyMVar)

808

\end{code}

809

810

Module names:

811

812

\begin{code}

813

-- | Does the string have the shape of a (possibly hierarchical) module
-- name?  Every dot-separated component must be non-empty, start with an
-- upper-case letter and continue with alphanumerics, underscores or
-- primes.
looksLikeModuleName :: String -> Bool
looksLikeModuleName name = case name of
    []             -> False
    (first : rest) -> isUpper first && component rest
  where
    -- Remainder of the current component; a dot starts a fresh one.
    component []           = True
    component ('.' : next) = looksLikeModuleName next
    component (ch : more)  = identChar ch && component more

    identChar ch = isAlphaNum ch || ch == '_' || ch == '\''

819

\end{code}

820

821

Akin to @Prelude.words@, but acts like the Bourne shell, treating

822

quoted strings as Haskell Strings, and also parses Haskell [String]

823

syntax.

824

825

\begin{code}

826

-- | Split off the first whitespace-delimited word of the input, after
-- skipping leading whitespace.  Fails if there is no such word.
getCmd :: String -> Either String             -- Error
                           (String, String) -- (Cmd, Rest)
getCmd s
  | null cmd  = Left ("Couldn't find command in " ++ show s)
  | otherwise = Right parsed
  where
    parsed@(cmd, _) = break isSpace (dropWhile isSpace s)

831

832

-- | Split the input into a command (via 'getCmd') and its arguments (via
-- 'toArgs' applied to the remainder), propagating the first error.
toCmdArgs :: String -> Either String             -- Error
                              (String, [String]) -- (Cmd, Args)
toCmdArgs s = either Left withCmd (getCmd s)
  where
    withCmd (cmd, rest) = either Left (\args -> Right (cmd, args)) (toArgs rest)

839

840

-- | Split a string into arguments.
--
-- If the input (after leading whitespace) starts with @[@ it is read as a
-- Haskell @[String]@ literal, which may only be followed by whitespace.
-- Otherwise it is split on whitespace, except that a word starting with a
-- double quote is read as a Haskell 'String' literal and must be followed
-- by whitespace or the end of the input.
--
-- Returns @Left@ with a message when a list or string literal cannot be
-- read.
toArgs :: String -> Either String   -- Error
                           [String] -- Args
toArgs str
    = case dropWhile isSpace str of
      s@('[':_) -> case reads s of
                   [(args, spaces)]
                    | all isSpace spaces ->
                       Right args
                   _ ->
                       Left ("Couldn't read " ++ show str ++ " as [String]")
      s -> toArgs' s
 where
  toArgs' s = case dropWhile isSpace s of
              [] -> Right []
              -- 'reads' skips leading whitespace itself, so it is given the
              -- unstripped string.
              ('"' : _) -> case reads s of
                           [(arg, rest)]
                              -- rest must either be [] or start with a space
                            | all isSpace (take 1 rest) ->
                               case toArgs' rest of
                               Left err -> Left err
                               Right args -> Right (arg : args)
                           _ ->
                               Left ("Couldn't read " ++ show s ++ " as String")
              s' -> case break isSpace s' of
                    (arg, s'') -> case toArgs' s'' of
                                  Left err -> Left err
                                  Right args -> Right (arg : args)

867

\end{code}

868

869

-- -----------------------------------------------------------------------------

870

-- Floats

871

872

\begin{code}

873

-- | Parse an unsigned decimal number -- digits, an optional fractional
-- part and an optional exponent -- from the front of a string, yielding the
-- value as a 'Rational' together with the unconsumed input.  The result
-- list is empty when the input does not start with a digit, or when an
-- exponent marker is not followed by an (optionally signed) integer.
readRational__ :: ReadS Rational -- NB: doesn't handle leading "-"
readRational__ r = do
     (n,d,s) <- readFix r
     (k,t)   <- readExp s
     -- n holds all digits with the decimal point removed; d is the number of
     -- fractional digits, so the exponent is corrected by d.
     return ((n%1)*10^^(k-d), t)
 where
     readFix r = do
        (ds,s)  <- lexDecDigits r
        (ds',t) <- lexDotDigits s
        return (read (ds++ds'), length ds', t)

     readExp (e:s) | e `elem` "eE" = readExp' s
     readExp s                     = return (0,s)

     readExp' ('+':s) = readDec s
     readExp' ('-':s) = do (k,t) <- readDec s
                           return (-k,t)
     readExp' s       = readDec s

     -- 'foldl1' is safe here: 'nonnull' guarantees at least one digit.
     readDec s = do
        (ds,r) <- nonnull isDigit s
        return (foldl1 (\n d -> n * 10 + d) [ ord d - ord '0' | d <- ds ],
                r)

     lexDecDigits = nonnull isDigit

     lexDotDigits ('.':s) = return (span isDigit s)
     lexDotDigits s       = return ("",s)

     -- Succeeds only when at least one character satisfies the predicate;
     -- the pattern-match failure otherwise produces no parse.
     nonnull p s = do (cs@(_:_),t) <- return (span p s)
                      return (cs,t)

904

905

-- | Read a whole string as a 'Rational', accepting an optional leading
-- minus sign.  Calls 'error' when 'readRational__' yields no parse, or more
-- than one parse, that consumes the entire input.
readRational :: String -> Rational -- NB: *does* handle a leading "-"
readRational top_s = signed top_s
  where
    signed ('-' : digits) = negate (unsigned digits)
    signed digits         = unsigned digits

    -- Only parses that leave no input behind are considered.
    unsigned s =
      case [ x | (x, "") <- readRational__ s ] of
        [x] -> x
        []  -> error ("readRational: no parse:"        ++ top_s)
        _   -> error ("readRational: ambiguous parse:" ++ top_s)

916

917

918

-----------------------------------------------------------------------------

919

-- Create a hierarchy of directories

920

921

-- | Create the given directory, first creating any missing parent
-- directories.  Does nothing when the path is a drive or the directory
-- already exists.
createDirectoryHierarchy :: FilePath -> IO ()
createDirectoryHierarchy dir
  | isDrive dir = return () -- XXX Hack
  | otherwise   = do
      exists <- doesDirectoryExist dir
      unless exists $ do
        -- Parents first, then the directory itself.
        createDirectoryHierarchy (takeDirectory dir)
        createDirectory dir

927

928

-----------------------------------------------------------------------------

929

-- Verify that the 'dirname' portion of a FilePath exists.

930

931

-- | Check whether the directory part of a path exists.  An empty directory
-- part counts as existing.
doesDirNameExist :: FilePath -> IO Bool
doesDirNameExist fpath
  | null parent = return True -- XXX Hack
  | otherwise   = doesDirectoryExist parent
  where
    parent = takeDirectory fpath

935

936

-- --------------------------------------------------------------

937

-- check existence & modification time at the same time

938

939

-- | Fetch a file's modification time, returning 'Nothing' when the file
-- does not exist.  Any other I/O error is re-raised.
modificationTimeIfExists :: FilePath -> IO (Maybe ClockTime)
modificationTimeIfExists f =
  (Just `fmap` getModificationTime f) `IO.catch` onFailure
  where
    onFailure e
      | isDoesNotExistError e = return Nothing
      | otherwise             = ioError e

945

946

-- | Split a string at the last character for which the predicate holds,
-- returning a pair of strings.  The first component is everything up to
-- (but not including) that character; the second is everything after it
-- (again not including the character itself).
--
-- If the predicate holds for no character, the whole string is returned in
-- the first component and the second one is empty.
splitLongestPrefix :: String -> (Char -> Bool) -> (String,String)
splitLongestPrefix str isSplitChar =
  -- Searching the reversed string finds the *last* matching character.
  case break isSplitChar (reverse str) of
    (_, [])                    -> (str, [])
    -- The matching character itself is dropped by the pattern.
    (revSuffix, _ : revPrefix) -> (reverse revPrefix, reverse revSuffix)

961

962

-- | Put a backslash in front of every whitespace character.
escapeSpaces :: String -> String
escapeSpaces = concatMap escape
  where
    escape c
      | isSpace c = ['\\', c]
      | otherwise = [c]

964

965

-- | Plain alias for 'String'.
-- NOTE(review): presumably a file-name suffix (extension) -- confirm against
-- the use sites, which are not visible here.
type Suffix = String

966

967

--------------------------------------------------------------

968

-- * Search path

969

--------------------------------------------------------------

970

971

-- | Split a search path into its components at every character accepted
-- by 'isSearchPathSeparator'.  Empty components are kept.  On Windows
-- builds a component wrapped in double quotes has the quotes removed.
parseSearchPath :: String -> [FilePath]
parseSearchPath path = pieces path
  where
    pieces :: String -> [String]
    pieces s =
      case break isSearchPathSeparator s of
        (raw, [])       -> [unquote raw]
        (raw, _ : more) -> unquote raw : pieces more

    unquote :: String -> String
#ifdef mingw32_HOST_OS
    unquote ('\"':xs@(_:_)) | last xs == '\"' = init xs
#endif
    unquote raw = raw

990

991

-- | Which kind of slash 'reslash' should produce.
data Direction = Forwards | Backwards

-- | Replace every forward slash and backslash in a path by the slash of
-- the requested direction.
reslash :: Direction -> FilePath -> FilePath
reslash d = map replaceSlash
  where
    replaceSlash c
      | c == '/' || c == '\\' = slash
      | otherwise             = c

    slash = case d of
      Forwards  -> '/'
      Backwards -> '\\'

1002

\end{code}

1003

1004

%************************************************************************

1005

%* *

1006

\subsection[Utils-Data]{Utils for defining Data instances}

1007

%* *

1008

%************************************************************************

1009

1010

These functions help us define Data instances for abstract types.

1011

1012

\begin{code}

1013

-- | Placeholder constructor for an abstract type: a prefix constructor
-- without fields, named @{abstract:NAME}@ and belonging to
-- @abstractDataType NAME@.
abstractConstr :: String -> Constr
abstractConstr n = mkConstr (abstractDataType n) label [] Prefix
  where
    label = concat ["{abstract:", n, "}"]

1015

\end{code}

1016

1017

\begin{code}

1018

-- | 'DataType' representation for an abstract type of the given name; its
-- only constructor is @abstractConstr NAME@.
abstractDataType :: String -> DataType
abstractDataType n = mkDataType n constrs
  where
    constrs = [abstractConstr n]

1020

\end{code}

1021

1022

\begin{code}

1023

-- Old GHC versions ship a base library in which this function's name is
-- misspelled ('mkNorepType'); provide the correctly spelled name for them.
#if __GLASGOW_HASKELL__ < 612
mkNoRepType :: String -> DataType
mkNoRepType name = mkNorepType name
#endif

1028

\end{code}

1029

Older »