speechset.h
4.22 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
/*
* ASCLITE
* Author: Jerome Ajot, Jon Fiscus, Nicolas Radde, Chris Laprun
*
* This software was developed at the National Institute of Standards and Technology by
* employees of the Federal Government in the course of their official duties. Pursuant
* to title 17 Section 105 of the United States Code this software is not subject to
* copyright protection and is in the public domain. ASCLITE is an experimental system.
* NIST assumes no responsibility whatsoever for its use by other parties, and makes no
* guarantees, expressed or implied, about its quality, reliability, or any other
* characteristic. We would appreciate acknowledgement if the software is used.
*
* THIS SOFTWARE IS PROVIDED "AS IS." With regard to this software, NIST MAKES NO EXPRESS
* OR IMPLIED WARRANTY AS TO ANY MATTER WHATSOEVER, INCLUDING MERCHANTABILITY,
* OR FITNESS FOR A PARTICULAR PURPOSE.
*/
#ifndef SPEECHSET_H
#define SPEECHSET_H
#include "stdinc.h"
#include "speech.h"
#include "logger.h"
/**
 * One category/label entry: four strings (type, id, title, description).
 * Stored per SpeechSet in a vector and exposed through the
 * GetCategoryLabel*() accessors.
 */
struct CATEGORYLABEL
{
    string type;
    string id;
    string title;
    string desc;
};

/** Alias under which the rest of the code refers to CATEGORYLABEL. */
typedef CATEGORYLABEL stcCategoryLabel;
/**
* A speech set represent all the data from one source (reference, participant)
* it's a collection of Speech(Speaker) from one source.
*/
class SpeechSet
{
public:
// class constructors
SpeechSet(const string& sourceFileName = "DEFAULT_FILE_NAME");
// class destructor
~SpeechSet();
/**
* Return the nb of Speech contain in this set
*/
size_t GetNumberOfSpeech() { return speeches.size(); }
/**
* Return the speech number i in the set
*/
Speech* GetSpeech(const size_t& index) { return speeches[index]; }
/**
* Add a speech into the set
*/
void AddSpeech(Speech* speech) { speeches.push_back(speech); }
/**
* Return true id the set contain only references
*/
bool IsRef() { return ref; }
/**
* Return true id the set contain only hypothesis
*/
bool IsHyp() { return hyp; }
bool IsGen() { return gen; }
/**
* Set the hyp/ref status of this set
*/
void SetOrigin(const string& status);
/** Determines if case is taken into account to align Tokens part of this Speech. */
bool PerformCaseSensitiveAlignment();
/** Determines if fragments are considered as correct when aligning Tokens part of this Speech. */
bool AreFragmentsCorrect();
/** Determines if optionally deletable Tokens need to be accounted for. */
bool UseOptionallyDeletable();
/** Retrieves the name of the file from which this SpeechSet originated. */
string GetSourceFileName() { return fileName; }
bool HasInterSegmentGap();
int GetMinTokensTime();
int GetMaxTokensTime();
void SetTitle(const string& title) { titleName = title; }
string GetTitle() { return titleName; }
void AddLabelCategory(const string& type, const string& id, const string& title, const string& desc);
size_t GetNumberCategoryLabel() { return m_VectCategoryLabel.size(); }
string GetCategoryLabelType(const size_t& ind) { return m_VectCategoryLabel[ind].type; }
string GetCategoryLabelID(const size_t& ind) { return m_VectCategoryLabel[ind].id; }
string GetCategoryLabelTitle(const size_t& ind) { return m_VectCategoryLabel[ind].title; }
string GetCategoryLabelDesc(const size_t& ind) { return m_VectCategoryLabel[ind].desc; }
private:
/**
* The internal speech collection
*/
vector<Speech*> speeches;
/**
* Store if the set is a reference set
*/
bool ref;
/**
* Store if the set is a hypothesis set
*/
bool hyp;
bool gen;
/**
* Reference to the logger
*/
static Logger* logger;
/** The name of the file from which this SpeechSet originated. */
string fileName;
string titleName;
/** Category/Label information (only for stm) */
vector<stcCategoryLabel> m_VectCategoryLabel;
/** Caches the value of the "align.case_sensitive" property. */
bool case_sensitive;
/** Caches the value of the "align.fragment_are_correct" property. */
bool fragments_are_correct;
/** Caches the values of the "align.optionally" property. */
bool optionally_deletable;
/** Updates the cached properties if needed. */
void UpdatePropertiesIfNeeded(const bool& force);
};
#endif // SPEECHSET_H