#MLNET – New version 0.4: improvements in text analysis using Word Embeddings

Pingback: #MLNet – Agregando paquetes en modo Preview desde MyGet, por ejemplo Microsoft.ML -Version 0.6.0 – El Bruno

Pingback: #MLNet – Adding NuGet Packages in Preview mode from MyGet, ie: Microsoft.ML-0.6.0 Version – El Bruno

Pingback: #MLNET – Solución para el error [System.InvalidOperationException, Entry point ‘ not found] al momento de entrenar un Pipeline – El Bruno

Pingback: #MLNET – Fix the error [System. InvalidOperationException, Entry Point ‘ Not found] when you train a pipeline – El Bruno

Pingback: #MLNET – Cambios en la API con la nueva version 0.6.0 – El Bruno

Pingback: #MLNET – API improvements in the new 0.6.0 version – El Bruno

Pingback: #MLNET – Analizando datos de la Pipeline con la nueva version API 0.6.0 (gracias LINQ!) – El Bruno

Pingback: #MLNET – Analyzing pipeline data in Machine Learning.Net using the new API 0.6.0 (thanks LINQ!) – El Bruno

Pingback: #MLNET – Novedades en la version 0.7 de Machine Learning.Net (la excusa perfecta para actualizar proximos eventos!) – El Bruno

Pingback: #MLNET – New version 0.7 for Machine Learning.Net (the perfect excuse to update my content for next events!) – El Bruno

Pingback: #MLNet – Visualizando datos del Pipeline en la versión 0.7.0 – El Bruno

Pingback: #MLNet – Looking at data in the Pipeline in version 0.7.0 – El Bruno

	/// <summary>
	/// Console sample that trains two binary sentiment classifiers on the same
	/// training file (one with plain text featurization, one that additionally
	/// concatenates word-embedding features) and prints evaluation metrics for each.
	/// </summary>
	internal static class Program
	{
		/// <summary>Model trained by <see cref="TrainModel"/>.</summary>
		private static PredictionModel<SentimentData, SentimentPrediction> _model;

		/// <summary>Model trained by <see cref="TrainModelWordEmbeddings"/>.</summary>
		private static PredictionModel<SentimentData, SentimentPrediction> _modelWordEmbeddings;

		/// <summary>Directory portion of the first command-line argument (the executable path).</summary>
		private static string AppPath
		{
			get { return Path.GetDirectoryName(Environment.GetCommandLineArgs()[0]); }
		}

		/// <summary>Training data file, located in the "datasets" folder under <see cref="AppPath"/>.</summary>
		private static string TrainDataPath
		{
			get { return Path.Combine(AppPath, "datasets", "sentiment-imdb-train.txt"); }
		}

		/// <summary>Test data file, located in the "datasets" folder under <see cref="AppPath"/>.</summary>
		private static string TestDataPath
		{
			get { return Path.Combine(AppPath, "datasets", "sentiment-yelp-test.txt"); }
		}

		/// <summary>
		/// Path of a model archive under <see cref="AppPath"/>.
		/// Not referenced by any other member of this class.
		/// </summary>
		private static string ModelPath
		{
			get { return Path.Combine(AppPath, "SentimentModel.zip"); }
		}

		/// <summary>
		/// Entry point: trains both models, evaluates each against the test file,
		/// then waits for a line of console input before exiting.
		/// </summary>
		/// <param name="args">Command-line arguments (unused).</param>
		private static void Main(string[] args)
		{
			// Both models must exist before the evaluation pass below.
			TrainModel();
			TrainModelWordEmbeddings();

			Evaluate(_model, "normal");
			Evaluate(_modelWordEmbeddings, "using WordEmbeddings");

			// Keep the console window open until the user presses Enter.
			Console.ReadLine();
		}

		/// <summary>
		/// Trains the baseline model (text featurizer feeding a FastTree binary
		/// classifier) and stores it in <see cref="_model"/>.
		/// </summary>
		public static void TrainModel()
		{
			var learningPipeline = new LearningPipeline();
			learningPipeline.Add(new TextLoader(TrainDataPath).CreateFrom<SentimentData>());
			learningPipeline.Add(new TextFeaturizer("Features", "SentimentText"));
			learningPipeline.Add(CreateFastTreeTrainer());

			Console.WriteLine("=============== Training model ===============");
			PredictionModel<SentimentData, SentimentPrediction> trained =
				learningPipeline.Train<SentimentData, SentimentPrediction>();
			Console.WriteLine("=============== End training ===============");

			_model = trained;
		}

		/// <summary>
		/// Trains the word-embeddings variant and stores it in
		/// <see cref="_modelWordEmbeddings"/>. The text featurizer writes to
		/// "FeaturesA" with token output enabled, the word-embeddings step maps
		/// "FeaturesA_TransformedText" to "FeaturesB", and both columns are
		/// concatenated into "Features" before the classifier.
		/// </summary>
		public static void TrainModelWordEmbeddings()
		{
			var learningPipeline = new LearningPipeline();
			learningPipeline.Add(new TextLoader(TrainDataPath).CreateFrom<SentimentData>());

			// OutputTokens is switched on so the "FeaturesA_TransformedText" column
			// consumed by the next step is available.
			var featurizer = new TextFeaturizer("FeaturesA", "SentimentText") { OutputTokens = true };
			learningPipeline.Add(featurizer);
			learningPipeline.Add(new WordEmbeddings(("FeaturesA_TransformedText", "FeaturesB")));
			learningPipeline.Add(new ColumnConcatenator("Features", "FeaturesA", "FeaturesB"));
			learningPipeline.Add(CreateFastTreeTrainer());

			Console.WriteLine("=============== Training model with Word Embeddings ===============");
			PredictionModel<SentimentData, SentimentPrediction> trained =
				learningPipeline.Train<SentimentData, SentimentPrediction>();
			Console.WriteLine("=============== End training ===============");

			_modelWordEmbeddings = trained;
		}

		/// <summary>
		/// Builds the FastTree binary classifier configuration shared by both
		/// training pipelines (5 leaves, 5 trees, minimum 2 documents per leaf).
		/// </summary>
		/// <returns>A newly constructed classifier with those settings.</returns>
		private static FastTreeBinaryClassifier CreateFastTreeTrainer()
		{
			return new FastTreeBinaryClassifier
			{
				NumLeaves = 5,
				NumTrees = 5,
				MinDocumentsInLeafs = 2
			};
		}

		/// <summary>
		/// Evaluates <paramref name="model"/> against the test data file and writes
		/// accuracy, AUC and F1 score to the console as two-decimal percentages.
		/// </summary>
		/// <param name="model">The trained model to evaluate.</param>
		/// <param name="name">Label inserted into the console banner for this run.</param>
		private static void Evaluate(PredictionModel<SentimentData, SentimentPrediction> model, string name)
		{
			var testLoader = new TextLoader(TestDataPath).CreateFrom<SentimentData>();
			var binaryEvaluator = new BinaryClassificationEvaluator();

			Console.WriteLine("=============== Evaluating model {0} ===============", name);
			var result = binaryEvaluator.Evaluate(model, testLoader);

			Console.WriteLine($"Accuracy: {result.Accuracy:P2}");
			Console.WriteLine($"Auc: {result.Auc:P2}");
			Console.WriteLine($"F1Score: {result.F1Score:P2}");
			Console.WriteLine("=============== End evaluating ===============");
			Console.WriteLine();
		}
	}

#MLNET – New version 0.4: improvements in text analysis using Word Embeddings

12 comments

Leave a comment Cancel reply

Share this:

Related

12 comments

Leave a comment Cancel reply