summaryrefslogtreecommitdiff
path: root/tnet_io/KaldiLib/Tokenizer.cc
diff options
context:
space:
mode:
authorDeterminant <[email protected]>2015-06-25 12:56:45 +0800
committerDeterminant <[email protected]>2015-06-25 12:56:45 +0800
commita74183ddb4ab8383bfe214b3745eb8a0a99ee47a (patch)
treed5e69cf8c4c2db2e3a4722778352fc3c95953bb2 /tnet_io/KaldiLib/Tokenizer.cc
parentb6301089cde20f4c825c7f5deaf179082aad63da (diff)
let HTK I/O implementation be a single package
Diffstat (limited to 'tnet_io/KaldiLib/Tokenizer.cc')
-rw-r--r--tnet_io/KaldiLib/Tokenizer.cc53
1 files changed, 0 insertions, 53 deletions
diff --git a/tnet_io/KaldiLib/Tokenizer.cc b/tnet_io/KaldiLib/Tokenizer.cc
deleted file mode 100644
index 0c49050..0000000
--- a/tnet_io/KaldiLib/Tokenizer.cc
+++ /dev/null
@@ -1,53 +0,0 @@
-#include "Tokenizer.h"
-#include "string.h"
-
-namespace TNet
-{
- //****************************************************************************
- //****************************************************************************
-  /**
-   * @brief Splits a C string into tokens and appends them to this container.
-   *
-   * The input is cut at every character contained in mSeparator. A separator
-   * that is directly preceded by a backslash is treated as escaped: it does
-   * not end the token, and both the backslash and the separator stay in the
-   * token text unchanged (no unescaping is performed here).
-   *
-   * When mSkipEmpty is set, zero-length tokens are never stored. This covers
-   * leading, consecutive and trailing separators as well as an empty input.
-   * When mSkipEmpty is not set, every gap between separators yields a token,
-   * so an empty input produces exactly one empty token.
-   *
-   * @param pString  Null-terminated text to tokenize. A null pointer is
-   *                 accepted and adds nothing.
-   */
-  void
-  Tokenizer::
-  AddString(const char* pString)
-  {
-    // constructing std::string from a null pointer is undefined behaviour
-    if (!pString) {
-      return;
-    }
-
-    // copy into string struct, which is more convenient
-    const std::string input(pString);
-
-    // first character of the token currently being collected
-    std::string::size_type token_start  = 0;
-    // where to resume looking for a separator; runs ahead of token_start
-    // only after an escaped separator has been stepped over
-    std::string::size_type search_start = 0;
-
-    // token_start becomes npos once the tail of the input has been handled
-    while (token_start != std::string::npos) {
-      // find the next separator
-      const std::string::size_type sep_pos =
-        input.find_first_of(mSeparator, search_start);
-
-      // if backslash is in front of separator, ignore this separator and
-      // keep extending the current token
-      if (sep_pos != std::string::npos && sep_pos != 0 &&
-          input[sep_pos - 1] == '\\') {
-        search_start = sep_pos + 1;
-        continue;
-      }
-
-      // the token ends at the separator, or at the end of input if none left
-      const std::string::size_type token_end =
-        (sep_pos == std::string::npos) ? input.length() : sep_pos;
-      const std::string::size_type token_len = token_end - token_start;
-
-      // we don't want to have empty records; checking the length (rather
-      // than the separator position) also filters the empty tail left by a
-      // trailing separator
-      if (token_len != 0 || !mSkipEmpty) {
-        this->push_back(input.substr(token_start, token_len));
-      }
-
-      // continue behind the separator, or stop when the input is exhausted
-      token_start  = (sep_pos == std::string::npos) ? sep_pos : sep_pos + 1;
-      search_start = token_start;
-    }
-  }
-
-
-} // namespace TNet
-