You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
PaddleSpeech/runtime/engine/kaldi/util/kaldi-io.h

281 lines
10 KiB

// util/kaldi-io.h
// Copyright 2009-2011 Microsoft Corporation; Jan Silovsky
// 2016 Xiaohui Zhang
// See ../../COPYING for clarification regarding multiple authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
// http://www.apache.org/licenses/LICENSE-2.0
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABLITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.
#ifndef KALDI_UTIL_KALDI_IO_H_
#define KALDI_UTIL_KALDI_IO_H_
#ifdef _MSC_VER
# include <fcntl.h>
# include <io.h>
#endif
#include <cctype> // For isspace.
#include <limits>
#include <string>
#include "base/kaldi-common.h"
#include "matrix/kaldi-matrix.h"
namespace kaldi {
class OutputImplBase; // Forward decl; defined in a .cc file
class InputImplBase; // Forward decl; defined in a .cc file
/// \addtogroup io_group
/// @{
// The Output and Input classes handle stream-opening for "extended" filenames
// that include actual files, standard-input/standard-output, pipes, and
// offsets into actual files. They also handle reading and writing the
// binary-mode headers for Kaldi files, where applicable. The classes have
// versions of the Open routines that throw and do not throw, depending whether
// the calling code wants to catch the errors or not; there are also versions
// that write (or do not write) the Kaldi binary-mode header that says if it's
// binary mode. Generally files that contain Kaldi objects will have the header
// on, so we know upon reading them whether they have the header. So you would
// use the OpenWithHeader routines for these (or the constructor); but other
// types of objects (e.g. FSTs) would have files without a header so you would
// use OpenNoHeader.
// We now document the types of extended filenames that we use.
//
// A "wxfilename" is an extended filename for writing. It can take three forms:
// (1) Filename: e.g. "/some/filename", "./a/b/c", "c:\Users\dpovey\My
// Documents\\boo"
// (whatever the actual file-system interprets)
// (2) Standard output: "" or "-"
// (3) A pipe: e.g. "| gzip -c > /tmp/abc.gz"
//
//
// A "rxfilename" is an extended filename for reading. It can take four forms:
// (1) An actual filename, whatever the file-system can read, e.g. "/my/file".
// (2) Standard input: "" or "-"
// (3) A pipe: e.g. "gunzip -c /tmp/abc.gz |"
// (4) An offset into a file, e.g.: "/mnt/blah/data/1.ark:24871"
// [these are created by the Table and TableWriter classes; I may also write
// a program that creates them for arbitrary files]
//
// Typical usage:
// ...
// bool binary;
// MyObject.Write(Output(some_filename, binary).Stream(), binary);
//
// ... more extensive example:
// {
// Output ko(some_filename, binary);
// MyObject1.Write(ko.Stream(), binary);
// MyObject2.Write(ko.Stream(), binary);
// }
enum OutputType {
kNoOutput,
kFileOutput,
kStandardOutput,
kPipeOutput
};
/// ClassifyWxfilename interprets filenames as follows:
/// - kNoOutput: invalid filenames (leading or trailing space, things that look
/// like wspecifiers and rspecifiers or like pipes to read from with leading
/// |.
/// - kFileOutput: Normal filenames
/// - kStandardOutput: The empty string or "-", interpreted as standard output
/// - kPipeOutput: pipes, e.g. "| gzip -c > /tmp/abc.gz"
OutputType ClassifyWxfilename(const std::string &wxfilename);
enum InputType {
kNoInput,
kFileInput,
kStandardInput,
kOffsetFileInput,
kPipeInput
};
/// ClassifyRxfilenames interprets filenames for reading as follows:
/// - kNoInput: invalid filenames (leading or trailing space, things that
/// look like wspecifiers and rspecifiers or pipes to write to
/// with trailing |.
/// - kFileInput: normal filenames
/// - kStandardInput: the empty string or "-"
/// - kPipeInput: e.g. "gunzip -c /tmp/abc.gz |"
/// - kOffsetFileInput: offsets into files, e.g. /some/filename:12970
InputType ClassifyRxfilename(const std::string &rxfilename);
class Output {
public:
// The normal constructor, provided for convenience.
// Equivalent to calling with default constructor then Open()
// with these arguments.
Output(const std::string &filename, bool binary, bool write_header = true);
Output(): impl_(NULL) {}
/// This opens the stream, with the given mode (binary or text). It returns
/// true on success and false on failure. However, it will throw if something
/// was already open and could not be closed (to avoid this, call Close()
/// first. if write_header == true and binary == true, it writes the Kaldi
/// binary-mode header ('\0' then 'B'). You may call Open even if it is
/// already open; it will close the existing stream and reopen (however if
/// closing the old stream failed it will throw).
bool Open(const std::string &wxfilename, bool binary, bool write_header);
inline bool IsOpen(); // return true if we have an open stream. Does not
// imply stream is good for writing.
std::ostream &Stream(); // will throw if not open; else returns stream.
// Close closes the stream. Calling Close is never necessary unless you
// want to avoid exceptions being thrown. There are times when calling
// Close will hurt efficiency (basically, when using offsets into files,
// and using the same Input object),
// but most of the time the user won't be doing this directly, it will
// be done in kaldi-table.{h, cc}, so you don't have to worry about it.
bool Close();
// This will throw if stream could not be closed (to check error status,
// call Close()).
~Output();
private:
OutputImplBase *impl_; // non-NULL if open.
std::string filename_;
KALDI_DISALLOW_COPY_AND_ASSIGN(Output);
};
// bool binary_in;
// Input ki(some_filename, &binary_in);
// MyObject.Read(ki.Stream(), binary_in);
//
// ... more extensive example:
//
// {
// bool binary_in;
// Input ki(some_filename, &binary_in);
// MyObject1.Read(ki.Stream(), &binary_in);
// MyObject2.Write(ki.Stream(), &binary_in);
// }
// Note that to catch errors you need to use try.. catch.
// Input communicates errors by throwing exceptions.
// Input interprets four kinds of filenames:
// (1) Normal filenames
// (2) The empty string or "-", interpreted as standard output
// (3) A pipe: e.g. "gunzip -c /tmp/abc.gz |"
// (4) Offsets into [real] files, e.g. "/my/filename:12049"
// The last one has no correspondence in Output.
class Input {
public:
/// The normal constructor. Opens the stream in binary mode.
/// Equivalent to calling the default constructor followed by Open(); then, if
/// binary != NULL, it calls ReadHeader(), putting the output in "binary"; it
/// throws on error.
Input(const std::string &rxfilename, bool *contents_binary = NULL);
Input(): impl_(NULL) {}
// Open opens the stream for reading (the mode, where relevant, is binary; use
// OpenTextMode for text-mode, we made this a separate function rather than a
// boolean argument, to avoid confusion with Kaldi's text/binary distinction,
// since reading in the file system's text mode is unusual.) If
// contents_binary != NULL, it reads the binary-mode header and puts it in the
// "binary" variable. Returns true on success. If it returns false it will
// not be open. You may call Open even if it is already open; it will close
// the existing stream and reopen (however if closing the old stream failed it
// will throw).
inline bool Open(const std::string &rxfilename, bool *contents_binary = NULL);
// As Open but (if the file system has text/binary modes) opens in text mode;
// you shouldn't ever have to use this as in Kaldi we read even text files in
// binary mode (and ignore the \r).
inline bool OpenTextMode(const std::string &rxfilename);
// Return true if currently open for reading and Stream() will
// succeed. Does not guarantee that the stream is good.
inline bool IsOpen();
// It is never necessary or helpful to call Close, except if
// you are concerned about to many filehandles being open.
// Close does not throw. It returns the exit code as int32
// in the case of a pipe [kPipeInput], and always zero otherwise.
int32 Close();
// Returns the underlying stream. Throws if !IsOpen()
std::istream &Stream();
// Destructor does not throw: input streams may legitimately fail so we
// don't worry about the status when we close them.
~Input();
private:
bool OpenInternal(const std::string &rxfilename, bool file_binary,
bool *contents_binary);
InputImplBase *impl_;
KALDI_DISALLOW_COPY_AND_ASSIGN(Input);
};
template <class C> void ReadKaldiObject(const std::string &filename,
C *c) {
bool binary_in;
Input ki(filename, &binary_in);
c->Read(ki.Stream(), binary_in);
}
// Specialize the template for reading matrices, because we want to be able to
// support reading 'ranges' (row and column ranges), like foo.mat[10:20].
template <> void ReadKaldiObject(const std::string &filename,
Matrix<float> *m);
template <> void ReadKaldiObject(const std::string &filename,
Matrix<double> *m);
template <class C> inline void WriteKaldiObject(const C &c,
const std::string &filename,
bool binary) {
Output ko(filename, binary);
c.Write(ko.Stream(), binary);
}
/// PrintableRxfilename turns the rxfilename into a more human-readable
/// form for error reporting, i.e. it does quoting and escaping and
/// replaces "" or "-" with "standard input".
std::string PrintableRxfilename(const std::string &rxfilename);
/// PrintableWxfilename turns the wxfilename into a more human-readable
/// form for error reporting, i.e. it does quoting and escaping and
/// replaces "" or "-" with "standard output".
std::string PrintableWxfilename(const std::string &wxfilename);
/// @}
} // end namespace kaldi.
#include "util/kaldi-io-inl.h"
#endif // KALDI_UTIL_KALDI_IO_H_