fix tokenize
base/str.cc: Fix tokenize so that it doesn't behave incorrectly when there are empty strings. test/tokentest.cc: Clean up the test function so it's easier to see what's going on --HG-- extra : convert_revision : c7a3db7bc516d3575b1cc4ab7afbd0f1fbe1ec6f
This commit is contained in:
parent
11894d3b4b
commit
c95e1281fc
2 changed files with 50 additions and 37 deletions
23
base/str.cc
23
base/str.cc
|
@ -26,11 +26,10 @@
|
||||||
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
#include <iostream>
|
|
||||||
|
|
||||||
#include <string.h>
|
|
||||||
#include <ctype.h>
|
#include <ctype.h>
|
||||||
|
|
||||||
|
#include <cstring>
|
||||||
|
#include <iostream>
|
||||||
#include <string>
|
#include <string>
|
||||||
#include <vector>
|
#include <vector>
|
||||||
|
|
||||||
|
@ -75,15 +74,17 @@ tokenize(vector<string>& v, const string &s, char token, bool ignore)
|
||||||
string::size_type first = 0;
|
string::size_type first = 0;
|
||||||
string::size_type last = s.find_first_of(token);
|
string::size_type last = s.find_first_of(token);
|
||||||
|
|
||||||
if (ignore) {
|
if (s.empty())
|
||||||
if (last == first) {
|
return;
|
||||||
while (last == first)
|
|
||||||
last = s.find_first_of(token, ++first);
|
|
||||||
|
|
||||||
if (last == string::npos) {
|
if (ignore && last == first) {
|
||||||
v.push_back(s);
|
while (last == first)
|
||||||
return;
|
last = s.find_first_of(token, ++first);
|
||||||
}
|
|
||||||
|
if (last == string::npos) {
|
||||||
|
if (first != s.size())
|
||||||
|
v.push_back(s.substr(first));
|
||||||
|
return;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -26,7 +26,7 @@
|
||||||
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
#include <iostream.h>
|
#include <iostream>
|
||||||
#include <string>
|
#include <string>
|
||||||
#include <vector>
|
#include <vector>
|
||||||
|
|
||||||
|
@ -35,35 +35,47 @@
|
||||||
int
|
int
|
||||||
main(int argc, char *argv[])
|
main(int argc, char *argv[])
|
||||||
{
|
{
|
||||||
if (argc != 3) {
|
using namespace std;
|
||||||
cout << "Usage: " << argv[0] << " <string> <token>\n";
|
|
||||||
exit(1);
|
|
||||||
}
|
|
||||||
|
|
||||||
int i;
|
if (argc != 3) {
|
||||||
string test = argv[1];
|
cout << "Usage: " << argv[0] << " <string> <token>\n";
|
||||||
vector<string> tokens1;
|
exit(1);
|
||||||
vector<string> tokens2;
|
}
|
||||||
char token = argv[2][0];
|
|
||||||
|
|
||||||
cout << "string = \"" << test << "\", token = \'" << token << "\'\n";
|
int i;
|
||||||
cout << "testing without ignore\n";
|
string test = argv[1];
|
||||||
tokenize(tokens1, test, token, false);
|
vector<string> tokens1;
|
||||||
|
vector<string> tokens2;
|
||||||
|
char token = argv[2][0];
|
||||||
|
|
||||||
if (tokens1.size()) {
|
cout << "string = \"" << test << "\", token = \'" << token << "\'\n";
|
||||||
for (i = 0; i < tokens1.size() - 1; i++)
|
cout << "testing without ignore\n";
|
||||||
cout << tokens1[i] << "(" << tokens1[i].size() << "), ";
|
tokenize(tokens1, test, token, false);
|
||||||
cout << tokens1[i] << "(" << tokens1[i].size() << ")\n";
|
|
||||||
}
|
|
||||||
|
|
||||||
cout << "testing with ignore\n";
|
if (tokens1.size()) {
|
||||||
tokenize(tokens2, test, token, true);
|
int size = tokens1.size();
|
||||||
|
cout << "size = " << size << "\n";
|
||||||
|
for (i = 0; i < size; i++) {
|
||||||
|
cout << "'" << tokens1[i] << "' (" << tokens1[i].size()
|
||||||
|
<< ")" << ((i == size - 1) ? "\n" : ", ");
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
cout << "no tokens" << endl;
|
||||||
|
}
|
||||||
|
|
||||||
if (tokens2.size()) {
|
cout << "testing with ignore\n";
|
||||||
for (i = 0; i < tokens2.size() - 1; i++)
|
tokenize(tokens2, test, token, true);
|
||||||
cout << tokens2[i] << "(" << tokens2[i].size() << "), ";
|
|
||||||
cout << tokens2[i] << "(" << tokens2[i].size() << ")\n";
|
|
||||||
}
|
|
||||||
|
|
||||||
return 0;
|
if (tokens2.size()) {
|
||||||
|
int size = tokens2.size();
|
||||||
|
cout << "size = " << size << "\n";
|
||||||
|
for (i = 0; i < size; i++) {
|
||||||
|
cout << "'" << tokens2[i] << "' (" << tokens2[i].size()
|
||||||
|
<< ")" << ((i == size - 1) ? "\n" : ", ");
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
cout << "no tokens" << endl;
|
||||||
|
}
|
||||||
|
|
||||||
|
return 0;
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in a new issue