Blame view
tools/sctk-2.4.10/src/asclite/core/speechset.h
4.22 KB
8dcb6dfcb first commit |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 |
/* * ASCLITE * Author: Jerome Ajot, Jon Fiscus, Nicolas Radde, Chris Laprun * * This software was developed at the National Institute of Standards and Technology by * employees of the Federal Government in the course of their official duties. Pursuant * to title 17 Section 105 of the United States Code this software is not subject to * copyright protection and is in the public domain. ASCLITE is an experimental system. * NIST assumes no responsibility whatsoever for its use by other parties, and makes no * guarantees, expressed or implied, about its quality, reliability, or any other * characteristic. We would appreciate acknowledgement if the software is used. * * THIS SOFTWARE IS PROVIDED "AS IS." With regard to this software, NIST MAKES NO EXPRESS * OR IMPLIED WARRANTY AS TO ANY MATTER WHATSOEVER, INCLUDING MERCHANTABILITY, * OR FITNESS FOR A PARTICULAR PURPOSE. */ #ifndef SPEECHSET_H #define SPEECHSET_H #include "stdinc.h" #include "speech.h" #include "logger.h" typedef struct CATEGORYLABEL { string type, id, title, desc; } stcCategoryLabel; /** * A speech set represent all the data from one source (reference, participant) * it's a collection of Speech(Speaker) from one source. */ class SpeechSet { public: // class constructors SpeechSet(const string& sourceFileName = "DEFAULT_FILE_NAME"); // class destructor ~SpeechSet(); /** * Return the nb of Speech contain in this set */ size_t GetNumberOfSpeech() { return speeches.size(); } /** * Return the speech number i in the set */ Speech* GetSpeech(const size_t& index) { return speeches[index]; } /** * Add a speech into the set */ void AddSpeech(Speech* speech) { speeches.push_back(speech); } /** * Return true id the set contain only references */ bool IsRef() { return ref; } /** * Return true id the set contain only hypothesis */ bool IsHyp() { return hyp; } bool IsGen() { return gen; } /** * Set the hyp/ref status of this set */ void SetOrigin(const string& status); /** Determines if case is taken into account to align Tokens part of this Speech. */ bool PerformCaseSensitiveAlignment(); /** Determines if fragments are considered as correct when aligning Tokens part of this Speech. */ bool AreFragmentsCorrect(); /** Determines if optionally deletable Tokens need to be accounted for. */ bool UseOptionallyDeletable(); /** Retrieves the name of the file from which this SpeechSet originated. */ string GetSourceFileName() { return fileName; } bool HasInterSegmentGap(); int GetMinTokensTime(); int GetMaxTokensTime(); void SetTitle(const string& title) { titleName = title; } string GetTitle() { return titleName; } void AddLabelCategory(const string& type, const string& id, const string& title, const string& desc); size_t GetNumberCategoryLabel() { return m_VectCategoryLabel.size(); } string GetCategoryLabelType(const size_t& ind) { return m_VectCategoryLabel[ind].type; } string GetCategoryLabelID(const size_t& ind) { return m_VectCategoryLabel[ind].id; } string GetCategoryLabelTitle(const size_t& ind) { return m_VectCategoryLabel[ind].title; } string GetCategoryLabelDesc(const size_t& ind) { return m_VectCategoryLabel[ind].desc; } private: /** * The internal speech collection */ vector<Speech*> speeches; /** * Store if the set is a reference set */ bool ref; /** * Store if the set is a hypothesis set */ bool hyp; bool gen; /** * Reference to the logger */ static Logger* logger; /** The name of the file from which this SpeechSet originated. */ string fileName; string titleName; /** Category/Label information (only for stm) */ vector<stcCategoryLabel> m_VectCategoryLabel; /** Caches the value of the "align.case_sensitive" property. */ bool case_sensitive; /** Caches the value of the "align.fragment_are_correct" property. */ bool fragments_are_correct; /** Caches the values of the "align.optionally" property. */ bool optionally_deletable; /** Updates the cached properties if needed. */ void UpdatePropertiesIfNeeded(const bool& force); }; #endif // SPEECHSET_H |