summaryrefslogtreecommitdiff
path: root/Assignment1/CamilStaps-assignment1-freqs.hs
blob: 6c6cd47bf82cf3db9a6f40b9f811dc2f450960f5 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
import System.Environment
import Data.String.Utils
import qualified Data.List as List

-- | Entry point.
--
-- Reads the text to analyse from the first command-line argument (any
-- further arguments are ignored), removes every space character from it and
-- prints the 1-gram, 2-gram and 3-gram frequency lists, each ordered from
-- the most frequent entry to the least frequent one.
--
-- Fails with a descriptive I/O error when no argument is supplied, instead
-- of crashing on the head of an empty list.
main :: IO ()
main = do
    args <- getArgs
    case args of
        [] -> ioError (userError "missing argument: expected the text to analyse")
        (text : _) -> do
            -- Only the space character is dropped; other whitespace is kept.
            let input = filter (/= ' ') text
            mapM_ (report input) [1, 2, 3]
  where
    -- Print the frequencies of all n-grams of the given size, highest first.
    report :: String -> Int -> IO ()
    report input n = print $ List.reverse $ List.sort $ countfreqs input n []

-- | @countfreqs s n fl@ adds the occurrence statistics of all n-grams of
-- @s@ to the frequency list @fl@ (pass @[]@ to start counting from scratch).
--
-- An n-gram is taken at every start position of @s@, from left to right,
-- and counting stops as soon as fewer than @n@ characters remain. Each
-- n-gram is recorded through 'freqsincr', which also determines the order
-- of the resulting list.
countfreqs :: String -> Int -> [Freq] -> [Freq]
countfreqs [] _ fl = fl
countfreqs s@(_ : rest) n fl
    -- Measuring only the n-gram keeps each step proportional to n instead of
    -- walking the entire remaining input at every position.
    | length gram < n = fl
    | otherwise = countfreqs rest n (freqsincr fl gram [])
  where
    gram = take n s

-- | @freqsincr fl s acc@ records one more occurrence of @s@ in @fl@.
-- Callers normally pass @[]@ for @acc@.
--
-- * If @s@ is not present in @fl@, the result is @acc@, followed by @fl@,
--   followed by a new entry for @s@ with count 1.
-- * If @s@ is present, its entry moves to the end with its count increased
--   by one; the entries that followed it in @fl@ come first, then @acc@,
--   then the entries that preceded it.
freqsincr :: [Freq] -> String -> [Freq] -> [Freq]
freqsincr fl s acc = go fl []
  where
    -- 'skipped' holds the entries already inspected, most recent first, so
    -- that each step is a cheap cons rather than an append to the end.
    go :: [Freq] -> [Freq] -> [Freq]
    go [] skipped = acc ++ reverse skipped ++ [Freq { item = s, freq = 1 }]
    go (entry : rest) skipped
        | get_item entry == s =
            rest ++ acc ++ reverse skipped ++ [entry { freq = get_freq entry + 1 }]
        | otherwise = go rest (entry : skipped)

-- | Occurrence count of one substring.
--
-- Both fields are strict, so an incremented count is computed when the
-- record is evaluated rather than being retained as a growing chain of
-- deferred additions.
data Freq = Freq
    { item :: !String -- ^ the substring being counted
    , freq :: !Int    -- ^ number of occurrences seen so far
    } deriving (Eq)

-- | The substring a frequency record refers to.
get_item :: Freq -> String
get_item Freq { item = s } = s

-- | The number of occurrences stored in a frequency record.
get_freq :: Freq -> Int
get_freq Freq { freq = count } = count

-- | Orders records by occurrence count first and by substring second.
--
-- The tie-break on the substring keeps this instance consistent with the
-- derived 'Eq' (two records compare as 'EQ' exactly when they are equal)
-- and makes the order of equally frequent entries independent of the order
-- in which they were inserted.
instance Ord Freq where
    compare f1 f2 =
        case compare (get_freq f1) (get_freq f2) of
            EQ -> compare (get_item f1) (get_item f2)
            unequal -> unequal

-- | Renders a record as the substring followed by its count, e.g. @ab (3x)@.
instance Show Freq where
    show entry = concat [get_item entry, " (", show (get_freq entry), "x)"]