TraceLab Component Library
 All Classes Namespaces Files Functions Variables Enumerations Enumerator Properties
TermDocumentMatrixImporter.cs
Go to the documentation of this file.
1 // TraceLab Component Library
2 // Copyright © 2012-2013 SEMERU
3 //
4 // This program is free software: you can redistribute it and/or modify
5 // it under the terms of the GNU General Public License as published by
6 // the Free Software Foundation, either version 3 of the License, or
7 // (at your option) any later version.
8 //
9 // This program is distributed in the hope that it will be useful,
10 // but WITHOUT ANY WARRANTY; without even the implied warranty of
11 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 // GNU General Public License for more details.
13 //
14 // You should have received a copy of the GNU General Public License
15 // along with this program. If not, see <http://www.gnu.org/licenses/>.
16 
17 using System.ComponentModel;
18 using TraceLab.Components.DevelopmentKit;
19 using TraceLabSDK;
20 using TraceLabSDK.Component.Config;
21 using TraceLabSDK.Types;
22 
23 namespace TraceLab.Components.Library.Importers.Artifacts
24 {
25  [Component(Name = "TermDocumentMatrix Importer",
26  Description = "Imports a document corpus in the form of a tab-delimited document-by-term matrix and outputs a TLArtifactsCollection",
27  Author = "SEMERU; Evan Moritz",
28  Version = "1.0.0.0",
29  ConfigurationType = typeof(TermDocumentMatrixConfig))]
30  [IOSpec(IOSpecType.Output, "Artifacts", typeof(TLArtifactsCollection))]
31  [Tag("Importers.TLArtifactsCollection.From TXT")]
32  public class TermDocumentMatrixImporter : BaseComponent
33  {
34  private TermDocumentMatrixConfig _config;
35 
36  public TermDocumentMatrixImporter(ComponentLogger log)
37  : base(log)
38  {
39  _config = new TermDocumentMatrixConfig();
40  Configuration = _config;
41  }
42 
43  public override void Compute()
44  {
45  Workspace.Store("Artifacts", TermDocumentMatrix.Load(_config.CorpusDocument.Absolute).ToTLArtifactsCollection());
46  }
47  }
48 
50  {
51  [DisplayName("Document matrix")]
52  [Description("Corpus file location")]
53  public FilePath CorpusDocument { get; set; }
54  }
55 }