// bin/copy-vector.cc // Copyright 2009-2012 Microsoft Corporation // 2012-2014 Johns Hopkins University (Author: Daniel Povey) // See ../../COPYING for clarification regarding multiple authors // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE, // MERCHANTABLITY OR NON-INFRINGEMENT. // See the Apache 2 License for the specific language governing permissions and // limitations under the License. #include "base/kaldi-common.h" #include "util/common-utils.h" #include "matrix/kaldi-vector.h" #include "transform/transform-common.h" int main(int argc, char *argv[]) { try { using namespace kaldi; const char *usage = "Copy vectors, or archives of vectors (e.g. transition-accs; speaker vectors)\n" "\n" "Usage: copy-vector [options] (|) (|)\n" " e.g.: copy-vector --binary=false 1.mat -\n" " copy-vector ark:2.trans ark,t:-\n" "see also: dot-weights, append-vector-to-feats\n"; bool binary = true; int32 change_dim = -1; float scale = 1.0; ParseOptions po(usage); po.Register("binary", &binary, "Write in binary mode (only " "relevant if output is a wxfilename)"); po.Register("change_dim", &change_dim, "Use this option to truncate or zero-pad the vectors."); po.Register("scale", &scale, "This option can be used to scale the vectors being copied."); po.Read(argc, argv); if (po.NumArgs() != 2) { po.PrintUsage(); exit(1); } std::string vector_in_fn = po.GetArg(1), vector_out_fn = po.GetArg(2); // all these "fn"'s are either rspecifiers or filenames. bool in_is_rspecifier = (ClassifyRspecifier(vector_in_fn, NULL, NULL) != kNoRspecifier), out_is_wspecifier = (ClassifyWspecifier(vector_out_fn, NULL, NULL, NULL) != kNoWspecifier); if (in_is_rspecifier != out_is_wspecifier) KALDI_ERR << "Cannot mix archives with regular files (copying vectors)"; if (!in_is_rspecifier) { Vector vec; ReadKaldiObject(vector_in_fn, &vec); Output ko(vector_out_fn, binary); if (change_dim >= 0) vec.Resize(change_dim, kCopyData); vec.Write(ko.Stream(), binary); KALDI_LOG << "Copied vector to " << vector_out_fn; return 0; } else { int num_done = 0; BaseFloatVectorWriter writer(vector_out_fn); SequentialBaseFloatVectorReader reader(vector_in_fn); if (change_dim < 0 && scale == 1.0) { for (; !reader.Done(); reader.Next(), num_done++) { writer.Write(reader.Key(), reader.Value()); } KALDI_LOG << "Copied " << num_done << " vectors."; } else { for (; !reader.Done(); reader.Next(), num_done++) { Vector vec(reader.Value()); if (change_dim >= 0) vec.Resize(change_dim, kCopyData); if (scale != 1.0) vec.Scale(scale); writer.Write(reader.Key(), reader.Value()); } KALDI_LOG << "Copied " << num_done << " vectors, setting dim to " << change_dim << " scaled by " << scale; } return (num_done != 0 ? 0 : 1); } } catch(const std::exception &e) { std::cerr << e.what(); return -1; } }