Skip to content

Commit

Permalink
fix: correct the split behavior during collecting dict entries (rime#762
Browse files Browse the repository at this point in the history
)
  • Loading branch information
WhiredPlanck committed Nov 26, 2023
1 parent bafe97f commit 5d19288
Show file tree
Hide file tree
Showing 3 changed files with 5 additions and 5 deletions.
6 changes: 3 additions & 3 deletions src/rime/algo/strings.cc
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@ vector<string> split(const string& str,
SplitBehavior behavior) {
vector<string> strings;
size_t lastPos, pos;
if (behavior == SplitBehavior::SkipEmpty) {
if (behavior == SplitBehavior::SkipToken) {
lastPos = str.find_first_not_of(delim, 0);
} else {
lastPos = 0;
Expand All @@ -17,7 +17,7 @@ vector<string> split(const string& str,

while (std::string::npos != pos || std::string::npos != lastPos) {
strings.emplace_back(str.substr(lastPos, pos - lastPos));
if (behavior == SplitBehavior::SkipEmpty) {
if (behavior == SplitBehavior::SkipToken) {
lastPos = str.find_first_not_of(delim, pos);
} else {
if (pos == std::string::npos) {
Expand All @@ -31,7 +31,7 @@ vector<string> split(const string& str,
};

vector<string> split(const string& str, const string& delim) {
return split(str, delim, SplitBehavior::SkipEmpty);
return split(str, delim, SplitBehavior::SkipToken);
};

} // namespace strings
Expand Down
2 changes: 1 addition & 1 deletion src/rime/algo/strings.h
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@
namespace rime {
namespace strings {

enum class SplitBehavior { KeepEmpty, SkipEmpty };
enum class SplitBehavior { KeepToken, SkipToken };

vector<string> split(const string& str,
const string& delim,
Expand Down
2 changes: 1 addition & 1 deletion src/rime/dict/entry_collector.cc
Original file line number Diff line number Diff line change
Expand Up @@ -87,7 +87,7 @@ void EntryCollector::Collect(const string& dict_file) {
continue;
}
// read a dict entry
auto row = strings::split(line, "\t");
auto row = strings::split(line, "\t", strings::SplitBehavior::KeepToken);
int num_columns = static_cast<int>(row.size());
if (num_columns <= text_column || row[text_column].empty()) {
LOG(WARNING) << "Missing entry text at #" << num_entries << ".";
Expand Down

0 comments on commit 5d19288

Please sign in to comment.