adding all of botlist, initial add
[botlist.git] / botlistprojects / botspider / spider / lib / haskell / src / Data / SpiderNet / DocumentInfo.hs
blobecc3f9747a15f93cf6b11bc6e6989de6d6e0e7da
1 --
2 --
3 module Data.SpiderNet.DocumentInfo (DocumentInfo(DocumentInfo), trainCatName, trainBayesProb, trainFisherProb,trainFeatureProb,
4 DocTrainInfo(DocTrainInfo), docName, docCharLen, docTokenLen, formatTrainInfo,
5 docWordDensity, docTrainInfo, docStopWordDensity, docPageInfo, docIsValidPage) where
6 import System.Environment
7 import Text.Printf
8 import Data.Char
9 import Data.SpiderNet.PageInfo
-- | One row of training/classification scores attached to a document.
--
-- The 'Show' instance in this module prints the four fields in declaration
-- order as comma-terminated values.
--
-- NOTE(review): the closing brace of this record was absent from the
-- reviewed text and has been restored; confirm that no @deriving@ clause
-- was lost together with it.
data DocTrainInfo = DocTrainInfo
    { trainCatName     :: String  -- ^ Category label (presumably the classifier category; confirm with callers).
    , trainBayesProb   :: Double  -- ^ Score named "Bayes"; presumably a probability in [0,1] (TODO confirm).
    , trainFisherProb  :: Double  -- ^ Score named "Fisher"; presumably a probability in [0,1] (TODO confirm).
    , trainFeatureProb :: Double  -- ^ Score named "feature"; exact meaning not visible here (TODO confirm).
    }
-- | Per-document statistics record.
--
-- The 'Show' instance in this module prints 'docName', 'docCharLen',
-- 'docTokenLen', 'docWordDensity', 'docStopWordDensity' and
-- 'docIsValidPage'; 'docTrainInfo' and 'docPageInfo' are carried by the
-- record but are not part of that rendering.
--
-- NOTE(review): the closing brace of this record was absent from the
-- reviewed text and has been restored; confirm that no @deriving@ clause
-- was lost together with it.
data DocumentInfo = DocumentInfo
    { docName            :: String            -- ^ Document name (presumably a file name or URL; confirm with callers).
    , docCharLen         :: Integer           -- ^ Length in characters, judging by the name (TODO confirm).
    , docTokenLen        :: Integer           -- ^ Length in tokens, judging by the name (TODO confirm).
    , docWordDensity     :: Double            -- ^ Word-density figure; the formula is not visible here.
    , docStopWordDensity :: Double            -- ^ Stop-word-density figure; the formula is not visible here.
    , docTrainInfo       :: [DocTrainInfo]    -- ^ Training score rows; see 'formatTrainInfo' for rendering.
    , docPageInfo        :: PageURLFieldInfo  -- ^ Page/URL details from "Data.SpiderNet.PageInfo".
    , docIsValidPage     :: Bool              -- ^ Validity flag; the criteria are decided by whoever builds the record.
    }
-- | Concatenate the 'show' rendering of every 'DocTrainInfo', in list order.
--
-- No separator is inserted between entries (each rendering already ends in
-- a comma); an empty list yields the empty string.
formatTrainInfo :: [DocTrainInfo] -> String
formatTrainInfo = concatMap show
-- | Render a 'DocumentInfo' as a comma-separated line fragment:
-- name, character length, token length, word density, stop-word density and
-- the validity flag, each followed by a comma (so the output ends in @,@).
--
-- 'docTrainInfo' and 'docPageInfo' are deliberately not touched here.
instance Show DocumentInfo where
    show info = printf "%s,%d,%d,%f,%f,%s," name chars tokens wordDens stopDens valid
      where
        name     = docName info
        chars    = docCharLen info
        tokens   = docTokenLen info
        wordDens = docWordDensity info
        stopDens = docStopWordDensity info
        -- The Bool is pre-rendered with 'show' so it fits the %s slot.
        valid    = show (docIsValidPage info)
-- | Render a 'DocTrainInfo' as four comma-terminated fields: the category
-- name followed by the Bayes, Fisher and feature scores, in that order.
instance Show DocTrainInfo where
    show info = printf "%s,%f,%f,%f," category bayes fisher feature
      where
        category = trainCatName info
        bayes    = trainBayesProb info
        fisher   = trainFisherProb info
        feature  = trainFeatureProb info
43 -- End of File