Blame view

tools/sctk-2.4.10/src/asclite/core/speechset.h 4.22 KB
8dcb6dfcb   Yannick Estève   first commit
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
  /*
   * ASCLITE
   * Author: Jerome Ajot, Jon Fiscus, Nicolas Radde, Chris Laprun
   *
   * This software was developed at the National Institute of Standards and Technology by 
   * employees of the Federal Government in the course of their official duties. Pursuant
   * to title 17 Section 105 of the United States Code this software is not subject to
   * copyright protection and is in the public domain. ASCLITE is an experimental system.
   * NIST assumes no responsibility whatsoever for its use by other parties, and makes no
   * guarantees, expressed or implied, about its quality, reliability, or any other
   * characteristic. We would appreciate acknowledgement if the software is used.
   *
   * THIS SOFTWARE IS PROVIDED "AS IS."  With regard to this software, NIST MAKES NO EXPRESS
   * OR IMPLIED WARRANTY AS TO ANY MATTER WHATSOEVER, INCLUDING MERCHANTABILITY,
   * OR FITNESS FOR A PARTICULAR PURPOSE.
   */
  
  #ifndef SPEECHSET_H
  #define SPEECHSET_H
  
  #include "stdinc.h"
  #include "speech.h"
  #include "logger.h"
  
  /**
   * One category/label entry, described by four strings:
   * its type, its identifier, its title and its description.
   */
  typedef struct CATEGORYLABEL
  {
  	string type;
  	string id;
  	string title;
  	string desc;
  } stcCategoryLabel;
  
  /**
   * A speech set represents all the data from one source (reference, participant):
   * it is a collection of Speech (speaker) objects coming from that source.
   */
  class SpeechSet
  {
  	public:
  		/**
  		 * Class constructor (defined out of line).
  		 * @param sourceFileName name of the source file; defaults to "DEFAULT_FILE_NAME".
  		 */
  		SpeechSet(const string& sourceFileName = "DEFAULT_FILE_NAME");
  		/**
  		 * Class destructor (defined out of line).
  		 * NOTE(review): the set stores raw Speech pointers; whether the destructor
  		 * deletes them is not visible from this header -- confirm ownership before
  		 * copying a SpeechSet.
  		 */
  		~SpeechSet();
  		/**
  		 * Return the number of Speech objects contained in this set.
  		 */
  		size_t GetNumberOfSpeech() const { return speeches.size(); }
  		/**
  		 * Return the Speech stored at position index in the set.
  		 * The index is not range-checked: it must be smaller than GetNumberOfSpeech().
  		 */
  		Speech* GetSpeech(const size_t& index) const { return speeches[index]; }
  		/**
  		 * Append a speech at the end of the set.
  		 */
  		void AddSpeech(Speech* speech) { speeches.push_back(speech); }
  		/**
  		 * Return true if the set contains only references.
  		 */
  		bool IsRef() const { return ref; }
  		/**
  		 * Return true if the set contains only hypotheses.
  		 */
  		bool IsHyp() const { return hyp; }
  		/**
  		 * Return the value of the "gen" flag.
  		 * NOTE(review): presumably marks a generic set -- confirm against SetOrigin().
  		 */
  		bool IsGen() const { return gen; }
  		/**
  		 * Set the hyp/ref status of this set.
  		 */
  		void SetOrigin(const string& status);
  		/** Determines if case is taken into account to align Tokens part of this Speech. */
  		bool PerformCaseSensitiveAlignment();
  		/** Determines if fragments are considered as correct when aligning Tokens part of this Speech. */
  		bool AreFragmentsCorrect();
  		/** Determines if optionally deletable Tokens need to be accounted for. */
  		bool UseOptionallyDeletable();

  		/** Retrieves the name of the file from which this SpeechSet originated. */
  		string GetSourceFileName() const { return fileName; }

  		bool HasInterSegmentGap();

  		int GetMinTokensTime();
  		int GetMaxTokensTime();

  		/** Stores the title of this set. */
  		void SetTitle(const string& title) { titleName = title; }
  		/** Returns a copy of the title stored by SetTitle(). */
  		string GetTitle() const { return titleName; }

  		/** Registers a category/label entry (defined out of line). */
  		void AddLabelCategory(const string& type, const string& id, const string& title, const string& desc);

  		/** Returns the number of category/label entries stored in this set. */
  		size_t GetNumberCategoryLabel() const { return m_VectCategoryLabel.size(); }
  		/*
  		 * Accessors for the fields of the category/label entry at position ind.
  		 * The index is not range-checked: it must be smaller than GetNumberCategoryLabel().
  		 */
  		string GetCategoryLabelType(const size_t& ind) const { return m_VectCategoryLabel[ind].type; }
  		string GetCategoryLabelID(const size_t& ind) const { return m_VectCategoryLabel[ind].id; }
  		string GetCategoryLabelTitle(const size_t& ind) const { return m_VectCategoryLabel[ind].title; }
  		string GetCategoryLabelDesc(const size_t& ind) const { return m_VectCategoryLabel[ind].desc; }
  	private:
  		/**
  		 * The internal speech collection
  		 */
  		vector<Speech*> speeches;
  		/**
  		 * Store if the set is a reference set
  		 */
  		bool ref;
  		/**
  		 * Store if the set is a hypothesis set
  		 */
  		bool hyp;
  		/**
  		 * Flag returned by IsGen()
  		 */
  		bool gen;
  		/**
  		 * Reference to the logger
  		 */
  		static Logger* logger;

  		/** The name of the file from which this SpeechSet originated. */
  		string fileName;
  		/** The title of this set, see SetTitle()/GetTitle(). */
  		string titleName;

  		/** Category/Label information (only for stm) */
  		vector<stcCategoryLabel> m_VectCategoryLabel;

  		/** Caches the value of the "align.case_sensitive" property. */
  		bool case_sensitive;
  		/** Caches the value of the "align.fragment_are_correct" property. */
  		bool fragments_are_correct;
  		/** Caches the values of the "align.optionally" property. */
  		bool optionally_deletable;
  		/** Updates the cached properties if needed. */
  		void UpdatePropertiesIfNeeded(const bool& force);
  };
  
  #endif // SPEECHSET_H