speechset.h 4.22 KB
edit raw blame history



1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

49

50

51

52

53

54

55

56

57

58

59

60

61

62

63

64

65

66

67

68

69

70

71

72

73

74

75

76

77

78

79

80

81

82

83

84

85

86

87

88

89

90

91

92

93

94

95

96

97

98

99

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128


/*
 * ASCLITE
 * Author: Jerome Ajot, Jon Fiscus, Nicolas Radde, Chris Laprun
 *
 * This software was developed at the National Institute of Standards and Technology by 
 * employees of the Federal Government in the course of their official duties. Pursuant
 * to title 17 Section 105 of the United States Code this software is not subject to
 * copyright protection and is in the public domain. ASCLITE is an experimental system.
 * NIST assumes no responsibility whatsoever for its use by other parties, and makes no
 * guarantees, expressed or implied, about its quality, reliability, or any other
 * characteristic. We would appreciate acknowledgement if the software is used.
 *
 * THIS SOFTWARE IS PROVIDED "AS IS."  With regard to this software, NIST MAKES NO EXPRESS
 * OR IMPLIED WARRANTY AS TO ANY MATTER WHATSOEVER, INCLUDING MERCHANTABILITY,
 * OR FITNESS FOR A PARTICULAR PURPOSE.
 */

#ifndef SPEECHSET_H
#define SPEECHSET_H

#include "stdinc.h"
#include "speech.h"
#include "logger.h"

/**
 * One category/label entry: four free-form text fields.
 * Both the tag name CATEGORYLABEL and the alias stcCategoryLabel
 * designate this same aggregate.
 */
struct CATEGORYLABEL
{
	string type;
	string id;
	string title;
	string desc;
};
typedef CATEGORYLABEL stcCategoryLabel;

/**
 * A speech set represents all the data from one source (reference, participant);
 * it is a collection of Speech (Speaker) objects coming from that source.
 *
 * NOTE(review): the set stores raw Speech pointers and declares a destructor
 * whose body is not visible in this header — confirm who owns the Speech
 * objects before copying a SpeechSet.
 */
class SpeechSet
{
	public:
		/**
		 * Class constructor.
		 * @param sourceFileName name of the originating file; defaults to "DEFAULT_FILE_NAME".
		 */
		SpeechSet(const string& sourceFileName = "DEFAULT_FILE_NAME");
		/** Class destructor. */
		~SpeechSet();
		/**
		 * Return the number of Speech objects contained in this set.
		 */
		size_t GetNumberOfSpeech() const { return speeches.size(); }
		/**
		 * Return the Speech stored at position index in the set.
		 * The index is not range-checked: it must be lower than GetNumberOfSpeech().
		 */
		Speech* GetSpeech(const size_t& index) const { return speeches[index]; }
		/**
		 * Add a speech into the set (appended after the existing ones).
		 */
		void AddSpeech(Speech* speech) { speeches.push_back(speech); }
		/**
		 * Return true if the set contains only references.
		 */
		bool IsRef() const { return ref; }
		/**
		 * Return true if the set contains only hypotheses.
		 */
		bool IsHyp() const { return hyp; }
		/**
		 * Return the value of the gen flag.
		 * NOTE(review): the meaning of this flag is not documented here;
		 * presumably it is set by SetOrigin() — confirm in the implementation.
		 */
		bool IsGen() const { return gen; }
		/**
		 * Set the hyp/ref status of this set.
		 */
		void SetOrigin(const string& status);
		/** Determines if case is taken into account to align Tokens part of this Speech. */
		bool PerformCaseSensitiveAlignment();
		/** Determines if fragments are considered as correct when aligning Tokens part of this Speech. */
		bool AreFragmentsCorrect();
		/** Determines if optionally deletable Tokens need to be accounted for. */
		bool UseOptionallyDeletable();

		/** Retrieves the name of the file from which this SpeechSet originated. */
		string GetSourceFileName() const { return fileName; }

		/** NOTE(review): undocumented; implementation not visible in this header. */
		bool HasInterSegmentGap();

		/** NOTE(review): undocumented; presumably the smallest token time in the set — confirm. */
		int GetMinTokensTime();
		/** NOTE(review): undocumented; presumably the largest token time in the set — confirm. */
		int GetMaxTokensTime();

		/** Stores the title of this set. */
		void SetTitle(const string& title) { titleName = title; }
		/** Returns the title previously stored with SetTitle(). */
		string GetTitle() const { return titleName; }

		/** Registers a category/label entry described by its type, id, title and description. */
		void AddLabelCategory(const string& type, const string& id, const string& title, const string& desc);

		/** Returns the number of category/label entries currently stored. */
		size_t GetNumberCategoryLabel() const { return m_VectCategoryLabel.size(); }
		/*
		 * Field accessors for the category/label entry at position ind.
		 * The index is not range-checked: it must be lower than GetNumberCategoryLabel().
		 */
		string GetCategoryLabelType(const size_t& ind) const { return m_VectCategoryLabel[ind].type; }
		string GetCategoryLabelID(const size_t& ind) const { return m_VectCategoryLabel[ind].id; }
		string GetCategoryLabelTitle(const size_t& ind) const { return m_VectCategoryLabel[ind].title; }
		string GetCategoryLabelDesc(const size_t& ind) const { return m_VectCategoryLabel[ind].desc; }
	private:
		/**
		 * The internal speech collection
		 */
		vector<Speech*> speeches;
		/**
		 * Store if the set is a reference set
		 */
		bool ref;
		/**
		 * Store if the set is a hypothesis set
		 */
		bool hyp;
		/** Flag returned by IsGen(). */
		bool gen;
		/**
		 * Reference to the logger
		 */
		static Logger* logger;

		/** The name of the file from which this SpeechSet originated. */
		string fileName;
		/** The title handled by SetTitle()/GetTitle(). */
		string titleName;

		/** Category/Label information (only for stm) */
		vector<stcCategoryLabel> m_VectCategoryLabel;

		/** Caches the value of the "align.case_sensitive" property. */
		bool case_sensitive;
		/** Caches the value of the "align.fragment_are_correct" property. */
		bool fragments_are_correct;
		/** Caches the values of the "align.optionally" property. */
		bool optionally_deletable;
		/** Updates the cached properties if needed. */
		void UpdatePropertiesIfNeeded(const bool& force);
};

#endif // SPEECHSET_H