Yannick Estève / ONTRAC-Kaldi

Blame view

tools/sctk-2.4.10/src/asclite/core/speech.cpp 5.95 KB
  /*
   * ASCLITE
   * Author: Jerome Ajot, Jon Fiscus, Nicolas Radde, Chris Laprun
   *
   * This software was developed at the National Institute of Standards and Technology by 
   * employees of the Federal Government in the course of their official duties. Pursuant
   * to title 17 Section 105 of the United States Code this software is not subject to
   * copyright protection and is in the public domain. ASCLITE is an experimental system.
   * NIST assumes no responsibility whatsoever for its use by other parties, and makes no
   * guarantees, expressed or implied, about its quality, reliability, or any other
   * characteristic. We would appreciate acknowledgement if the software is used.
   *
   * THIS SOFTWARE IS PROVIDED "AS IS."  With regard to this software, NIST MAKES NO EXPRESS
   * OR IMPLIED WARRANTY AS TO ANY MATTER WHATSOEVER, INCLUDING MERCHANTABILITY,
   * OR FITNESS FOR A PARTICULAR PURPOSE.
   */
   
  /**
   * Internal representation of an hypothesis file or a reference file.
   */
  
  #include "speech.h" // class's header file
  #include "speechset.h"
  
  Logger* Speech::m_pLogger = Logger::getLogger();
  
  // class constructor
  Speech::Speech() {}
  
  // class constructor
  Speech::Speech(SpeechSet* parent)
  {
  	parentSet = parent;
  }
  
  Speech::Speech(const vector<Segment *>& segments)
  {
  	m_segments = vector<Segment *>(segments);
  }
  
  // class destructor
  Speech::~Speech()
  {
  	for(size_t i=0; i<m_segments.size(); ++i)
  	{
  		Segment* ptr_elt = m_segments[i];
  		
  		if(ptr_elt)
  			delete ptr_elt;
  	}
  	
  	m_segments.clear();
  }
  
  bool Speech::PerformCaseSensitiveAlignment()
  {
  	return parentSet->PerformCaseSensitiveAlignment();
  }
  
  bool Speech::AreFragmentsCorrect()
  {
  	return parentSet->AreFragmentsCorrect();
  }
  
  bool Speech::UseOptionallyDeletable()
  {
  	return parentSet->UseOptionallyDeletable();
  }
  
  /**
   * Retrieves the SpeechSet in which this Speech is located 
   */
  SpeechSet* Speech::GetParentSpeechSet()
  {
    return parentSet;
  }
  
  /**
  * Return the next Segment starting at the specified time for
  * the specified source and channel. If the time is in the middle of
  * A segment return the segment itself.
  */
  Segment* Speech::NextSegment(const int& time, const string& source, const string& channel)
  {
  	int last_endTime = 0;	
  	
  	for (size_t i=0 ; i < m_segments.size() ; ++i)
  	{
          Segment *currentSegment = m_segments[i];
  		
  		if (currentSegment->GetSource() == source && currentSegment->GetChannel() == channel)
  		{
  			if (currentSegment->GetEndTime() > time && last_endTime <= time)
  			{
  				return currentSegment;
  			}
              
  			last_endTime = currentSegment->GetEndTime();
  		}
  	}
      
  	return NULL;
  }
  
  /**
   * Return the segments of this speech by the given time
   */
  vector<Segment*> Speech::GetSegmentsByTime(const int& start, const int& end, const string& source, const string& channel)
  {
  	vector<Segment*> res;
      
  	for (size_t i=0 ; i < m_segments.size() ; ++i)
  	{
  		Segment *currentSegment = m_segments[i];
  		if (currentSegment->GetSource() == source && currentSegment->GetChannel() == channel)
  		{
  			int s_mid = ((currentSegment->GetEndTime()+currentSegment->GetStartTime()) / 2);
              
  			if (s_mid >= start && s_mid < end)
  			{
  				res.push_back(currentSegment);
  			}
  		}
  	}
  	return res;
  }
  
  string Speech::ToString()
  {
  	std::ostringstream oss;
  	oss << "<Speech NbOfSegments='" << NbOfSegments() << "'>";
  	
  	for(size_t i = 0; i < NbOfSegments(); ++i)
      {
          Segment *seg = GetSegment(i);
          oss << seg->ToString() << endl;
      }	
  	oss << "</Speech>";
  	return oss.str();
  }
  
  void Speech::RemoveSegment(Segment* currentSegment)
  {	
  	list<Token*> listPreviousTokenofFirstToken;
  	list<Token*> listNextTokenofLastToken;
  		
  	// Remove links from the previous tokens of the first tokens of the segment
  	for(size_t f=0; f<currentSegment->GetNumberOfFirstToken(); ++f)
  	{
  		Token* firstToken = currentSegment->GetFirstToken(f);
  		
  		if(firstToken)
  		{
  			for(size_t p=0; p<firstToken->GetNbOfPrecTokens(); ++p)
  			{
  				Token* previousTokenofFirstToken = firstToken->GetPrecToken(p);
  				listPreviousTokenofFirstToken.push_back(previousTokenofFirstToken);
  				previousTokenofFirstToken->UnlinkNextToken(firstToken);
  			}
  		}
  	}
  	
  	// Remove links from the next tokens of the last tokens of the segment
  	for(size_t l=0; l<currentSegment->GetNumberOfLastToken(); ++l)
  	{
  		Token* lastToken = currentSegment->GetLastToken(l);
  		
  		if(lastToken)
  		{
  			for(size_t n=0; n<lastToken->GetNbOfNextTokens(); ++n)
  			{
  				Token* nextTokenofLastToken = lastToken->GetNextToken(n);
  				listNextTokenofLastToken.push_back(nextTokenofLastToken);
  				nextTokenofLastToken->UnlinkPrevToken(lastToken);
  			}
  		}
  	}
  		
  	// Re-attach the tokens
  	list<Token*>::iterator prev  = listPreviousTokenofFirstToken.begin();
  	list<Token*>::iterator eprev = listPreviousTokenofFirstToken.end();
  	list<Token*>::iterator next  = listNextTokenofLastToken.begin();
  	list<Token*>::iterator enext = listNextTokenofLastToken.end();
  	
  	while(prev != eprev)
  	{
  		while(next != enext)
  		{
  			(*prev)->AddNextToken(*next);
  			(*next)->AddPrecToken(*prev);
  			
  			++next;
  		}
  		
  		++prev;
  	}
      
      listPreviousTokenofFirstToken.clear();
      listNextTokenofLastToken.clear();
    	  	  
      // Remove Segment from vector
      vector<Segment*>::iterator SegIter = m_segments.begin();
      	
  	while (SegIter != m_segments.end() && (*SegIter) != currentSegment)
  		++SegIter;
  
  	if (SegIter == m_segments.end())
      {
  		LOG_FATAL(m_pLogger, "Speech::RemoveSegment(), the segment is not at the right spot!!");
  		exit(E_INVALID);
  	}
  	
  	m_segments.erase(SegIter);
      
      // destroy! the segment now
      delete currentSegment;
  }
  
  int Speech::GetMinTokensTime()
  {
  	int MinTime = -1;
  	
  	for(size_t spj=0; spj<NbOfSegments(); ++spj)
  	{
  		int tmpmin = GetSegment(spj)->GetMinTokensTime();
  		
  		if ( (MinTime == -1) || (tmpmin < MinTime) )
  			MinTime = tmpmin;
  	}
  	
  	return MinTime;
  }
  
  int Speech::GetMaxTokensTime()
  {
  	int MaxTime = -1;
  	
  	for(size_t spj=0; spj<NbOfSegments(); ++spj)
  	{
  		int tmpmax = GetSegment(spj)->GetMaxTokensTime();
  		
  		if ( (MaxTime == -1) || (tmpmax > MaxTime) )
  			MaxTime = tmpmax;
  	}
  	
  	return MaxTime;
  }