-- | Record types describing a document ('DocumentInfo') and its
-- per-category training scores ('DocTrainInfo'), together with their
-- comma-separated 'Show' renderings and the 'formatTrainInfo' helper.
--
-- The export list exposes both data constructors and every record field
-- accessor individually.
module Data.SpiderNet.DocumentInfo
    ( DocumentInfo(DocumentInfo)
    , trainCatName
    , trainBayesProb
    , trainFisherProb
    , trainFeatureProb
    , DocTrainInfo(DocTrainInfo)
    , docName
    , docCharLen
    , docTokenLen
    , formatTrainInfo
    , docWordDensity
    , docTrainInfo
    , docStopWordDensity
    , docPageInfo
    , docIsValidPage
    ) where
import Data.SpiderNet.PageInfo
import System.Environment
import Text.Printf (printf)
-- | Scores attached to one training category.
--
-- The record only stores the values; nothing in this declaration
-- constrains their range.
data DocTrainInfo = DocTrainInfo
    { -- | Name of the category these scores belong to.
      trainCatName     :: String
      -- | Score stored as @trainBayesProb@ (presumably a naive-Bayes
      -- probability -- confirm against the code that fills it in).
    , trainBayesProb   :: Double
      -- | Score stored as @trainFisherProb@ (presumably a Fisher-method
      -- probability -- confirm against the code that fills it in).
    , trainFisherProb  :: Double
      -- | Score stored as @trainFeatureProb@ (meaning not visible here;
      -- confirm against the producer).
    , trainFeatureProb :: Double
    }
-- | Summary information about a single document.
--
-- The 'docName' field is exported by this module and rendered with a
-- @%s@ conversion by the 'Show' instance, so it is declared here as a
-- 'String'.
data DocumentInfo = DocumentInfo
    { -- | Name of the document; printed first by 'show'.
      docName            :: String
      -- | Stored as @docCharLen@ (presumably the length in characters --
      -- confirm with the producer).
    , docCharLen         :: Integer
      -- | Stored as @docTokenLen@ (presumably the number of tokens --
      -- confirm with the producer).
    , docTokenLen        :: Integer
      -- | Stored as @docWordDensity@; how it is computed is not visible
      -- here.
    , docWordDensity     :: Double
      -- | Stored as @docStopWordDensity@; how it is computed is not
      -- visible here.
    , docStopWordDensity :: Double
      -- | Training scores, one 'DocTrainInfo' per entry.
    , docTrainInfo       :: [DocTrainInfo]
      -- | URL/page field information, as defined by
      -- "Data.SpiderNet.PageInfo".
    , docPageInfo        :: PageURLFieldInfo
      -- | Validity flag for the page; the criterion is decided by
      -- whoever builds the record.
    , docIsValidPage     :: Bool
    }
-- | Render a list of training records as one string by concatenating
-- the 'show' output of every element, in list order.
--
-- No separator is inserted between elements, and an empty list yields
-- the empty string.
formatTrainInfo :: [DocTrainInfo] -> String
formatTrainInfo = concatMap show
-- | Comma-separated rendering of a 'DocumentInfo'.
--
-- Fields are emitted in this order: name, character length, token
-- length, word density, stop-word density, validity flag (via 'show' on
-- the 'Bool'). Every field, including the last, is followed by a comma.
-- 'docTrainInfo' and 'docPageInfo' are not part of the output.
instance Show DocumentInfo where
    show info =
        printf "%s,%d,%d,%f,%f,%s,"
            (docName info)
            (docCharLen info)
            (docTokenLen info)
            (docWordDensity info)
            (docStopWordDensity info)
            (show (docIsValidPage info))
-- | Comma-separated rendering of a 'DocTrainInfo'.
--
-- Fields are emitted in this order: category name, then the three
-- scores (Bayes, Fisher, feature), each formatted with @%f@. Every
-- field, including the last, is followed by a comma, so consecutive
-- renderings can be concatenated directly.
instance Show DocTrainInfo where
    show info =
        printf "%s,%f,%f,%f,"
            (trainCatName info)
            (trainBayesProb info)
            (trainFisherProb info)
            (trainFeatureProb info)