2 people like it.

Sentiment Classification with ML.Net - Sample

ML.Net sentiment classification example using Gradient Boosted trees Needs to be compiled in a dotnet core F# project Uses F# 4.1 struct tuples which is required by the ML.Net API

 1: 
 2: 
 3: 
 4: 
 5: 
 6: 
 7: 
 8: 
 9: 
10: 
11: 
12: 
13: 
14: 
15: 
16: 
17: 
18: 
19: 
20: 
21: 
22: 
23: 
24: 
25: 
26: 
27: 
28: 
29: 
30: 
31: 
32: 
33: 
34: 
35: 
36: 
37: 
38: 
39: 
40: 
41: 
42: 
43: 
44: 
45: 
46: 
47: 
48: 
49: 
50: 
51: 
52: 
53: 
54: 
55: 
56: 
57: 
58: 
59: 
60: 
61: 
62: 
63: 
64: 
65: 
66: 
67: 
68: 
69: 
70: 
71: 
72: 
73: 
74: 
75: 
76: 
77: 
78: 
79: 
80: 
81: 
82: 
83: 
84: 
85: 
86: 
87: 
88: 
module Model

open System
open Microsoft.ML
open Microsoft.ML.StaticPipe

(* 
Nuget pacakges: 
    Microsoft.ML (0.9.0)
    Microsoft.ML.StaticPipe (0.9.0)

Data:
    download test / train datasets from here:
    https://github.com/dotnet/machinelearning/blob/master/test/data/wikipedia-detox-250-line-data.tsv
    https://github.com/dotnet/machinelearning/blob/master/test/data/wikipedia-detox-250-line-test.tsv

Other Documentation:
    This sample uses the 0.9.0 'static' pipeline API and is based on MS documentation located here:
     - https://docs.microsoft.com/en-us/dotnet/machine-learning/tutorials/sentiment-analysis

     *Note: At the time of writing, the code in the above page seems to be based on v 0.7.0 and looks quite different 
     from what is shown here.

*)

let trainDataPath = @"C:\Users\fwaris\Source\Repos\MLNetTest\MLNetTestF\Data\Train.txt"
let testDataPath = @"C:\Users\fwaris\Source\Repos\MLNetTest\MLNetTestF\Data\Test.txt"
let modelPath = @"C:\Users\fwaris\Source\Repos\MLNetTest\MLNetTestF\Data\Model.zip"

//load data, train and evaluate the model
let train_and_test() = 

    let ctx = MLContext(Nullable 10)

    let reader = 
        TextLoaderStatic.CreateReader(
                            ctx, 
                            (fun (c:TextLoaderStatic.Context) -> 
                                struct (
                                    c.LoadBool(0),
                                    c.LoadText(1)
                                )),
                            separator = '\t',
                            hasHeader = true)

                          
    let trainData = reader.Read(trainDataPath)
    let testData = reader.Read(testDataPath)

    let pipeline = 
        reader
            .MakeNewEstimator()
            .Append(fun struct (lbl,text) -> 
                let features = text.FeaturizeText()
                let struct(score,probability,predictedLabel) = 
                        ctx.BinaryClassification.Trainers.FastTree(
                                lbl,
                                features,
                                numTrees= 50,
                                numLeaves = 50,
                                minDatapointsInLeaves=20
                                )
                struct(
                    lbl,
                    text,
                    features,
                    score,
                    probability,
                    predictedLabel
                    ))

    let model = pipeline.Fit(trainData)

    let predictions = model.Transform(testData)

    let label struct (lbl,text,features,score,prob,predLbl) = lbl
    let pred struct (lbl,text,features,score,prob,predLbl) = struct(score,prob,predLbl)

    let metrics = ctx.BinaryClassification.Evaluate(
                        predictions,
                        label = label,
                        pred = pred)
    printfn 
        "Accuracy =  %0.2f, AUC = %0.2f, F1 = %0.2f" 
         metrics.Accuracy
         metrics.Auc
         metrics.F1Score
                    
module Model
namespace System
namespace Microsoft
val trainDataPath : string

Full name: Model.trainDataPath
val testDataPath : string

Full name: Model.testDataPath
val modelPath : string

Full name: Model.modelPath
val train_and_test : unit -> unit

Full name: Model.train_and_test
val ctx : obj
Multiple items
type Nullable =
  static member Compare<'T> : n1:Nullable<'T> * n2:Nullable<'T> -> int
  static member Equals<'T> : n1:Nullable<'T> * n2:Nullable<'T> -> bool
  static member GetUnderlyingType : nullableType:Type -> Type

Full name: System.Nullable

--------------------
type Nullable<'T (requires default constructor and value type and 'T :> ValueType)> =
  struct
    new : value:'T -> Nullable<'T>
    member Equals : other:obj -> bool
    member GetHashCode : unit -> int
    member GetValueOrDefault : unit -> 'T + 1 overload
    member HasValue : bool
    member ToString : unit -> string
    member Value : 'T
  end

Full name: System.Nullable<_>

--------------------
Nullable()
Nullable(value: 'T) : unit
val reader : 'a
val trainData : obj
val testData : obj
val pipeline : obj
val model : obj
val predictions : obj
val metrics : obj
val printfn : format:Printf.TextWriterFormat<'T> -> 'T

Full name: Microsoft.FSharp.Core.ExtraTopLevelOperators.printfn
Raw view Test code New version

More information

Link:http://fssnip.net/7VS
Posted:6 years ago
Author:Faisal Waris
Tags: machine learning , ml.net , sentiment classification , binary classifier