#region Using Directives
using System;
using System.Collections.Generic;
#endregion
/*
* $author: QmQ
* $source: http://www.rntsoft.com/useritems/SimpleStringTokenizer.asp
* $date: 10-June-2006
*/
namespace CBRSystem.Data
{
#region [Summary and remarks]
///
/// Implements a StringTokenizer class for splitting a string
/// into substrings using a set of delimiters.
///
///
/// C# version of the java.util.StringTokenizer class.
/// Basicly it's a wrapper class around the String.Split method.
/// It implements all of it's Java equivalent methods apart from those only needed by the Enumeration interface.
/// All implemented Java-compilant methods have their C# equivalents in properties. They however differ in names
/// since Java uses the (Hungarian-like) notation runMe() while C# uses Camel-cased RunMe() and thus
/// Java's nextToken() method is just an alias of the NextToken property.
///
#endregion
public class StringTokenizer : IEnumerable
{
///
/// String conatining the default set of delimiters which are " \t\n\r\f" :
/// the space character, the tab character, the newline character, the carriage-return character, and the form-feed character.
///
public const string DefaultDelimiters = " \t\n\r\f";
private readonly string delims = DefaultDelimiters;
private string[] tokens = null;
private int index = 0;
private string empty = String.Empty;
#region [Constructors]
///
/// Constructs a string tokenizer for the specified string using the default delimiters .
///
/// The string to be tokenized.
/// Thrown when the passed string is null
public StringTokenizer(string str)
{
Tokenize(str, false, false);
}
///
/// Constructs a string tokenizer for the specified string using the given delimiters.
///
/// The string to be tokenized.
/// The delimiters used to tokenize the string (each will be used as a delimiter).
/// Thrown when the passed string is null
public StringTokenizer(string str, string delims)
{
if(delims!=null) this.delims = delims;
Tokenize(str, false, false);
}
///
/// Constructs a string tokenizer for the specified string using the given delimiters.
///
/// The string to be tokenized.
/// The delimiters used to tokenize the string.
public StringTokenizer(string str, params char[] delims)
{
if (delims != null) this.delims = new string(delims);
Tokenize(str, false, false);
}
///
/// Constructs a string tokenizer for the specified string using the given delimiters and optionally returning them as tokens.
///
/// The string to be tokenized.
/// The delimiters used to tokenize the string (each will be used as a delimiter).
/// If set to true the encountered delimiters will also be returned as tokens.
/// Thrown when the passed string is null
public StringTokenizer(string str, string delims, bool returnDelims)
{
if (delims != null) this.delims = delims;
Tokenize(str, returnDelims, false);
}
///
/// Constructs a string tokenizer for the specified string using the given delimiters,
/// optionally returning them as tokens. Also empty tokens may be returned using the string.
///
/// The string to be tokenized.
/// The delimiters used to tokenize the string (each will be used as a delimiter).
/// If set to true the encountered delimiters will also be returned as tokens.
/// If set to true empty tokens will also be returned.
/// Thrown when the passed string is null
public StringTokenizer(string str, string delims, bool returnDelims, bool returnEmpty)
{
if (delims != null) this.delims = delims;
Tokenize(str, returnDelims, returnEmpty);
}
///
/// Constructs a string tokenizer for the specified string using the given delimiters,
/// optionally returning them as tokens. Also empty tokens may be returned using the string.
///
/// The string to be tokenized.
/// The delimiters used to tokenize the string (each will be used as a delimiter).
/// If set to true the encountered delimiters will also be returned as tokens.
/// If set to true empty tokens will also be returned.
/// The string to be returned as an empty token.
/// Thrown when the passed string is null
public StringTokenizer(string str, string delims, bool returnDelims, bool returnEmpty, string empty)
{
if (delims != null) this.delims = delims;
this.empty = empty;
Tokenize(str, returnDelims, returnEmpty);
}
#endregion
#region [The big tokenization method]
private void Tokenize(string str, bool returnDelims, bool returnEmpty)
{
if(returnDelims)
{
this.tokens = str.Split(this.delims.ToCharArray(), StringSplitOptions.RemoveEmptyEntries);
List tmp = new List(tokens.Length << 1);
int delimIndex = str.IndexOfAny(this.delims.ToCharArray());
int tokensIndex = 0;
int prevDelimIdx = delimIndex-1;
if (delimIndex == 0)
do
{
tmp.Add(new string(str[delimIndex], 1));
prevDelimIdx = delimIndex++;
delimIndex = str.IndexOfAny(this.delims.ToCharArray(), delimIndex);
if (returnEmpty && delimIndex == prevDelimIdx + 1)
tmp.Add(this.empty);
} while (delimIndex == prevDelimIdx + 1);
while (delimIndex > -1)
{
tmp.Add(this.tokens[tokensIndex++]);
do
{
tmp.Add(new string(str[delimIndex], 1));
prevDelimIdx = delimIndex++;
delimIndex = str.IndexOfAny(this.delims.ToCharArray(), delimIndex);
if (returnEmpty && delimIndex == prevDelimIdx + 1)
tmp.Add(this.empty);
} while (delimIndex == prevDelimIdx + 1);
}
if (tokensIndex < tokens.Length)
tmp.Add(this.tokens[tokensIndex++]);
this.tokens = tmp.ToArray();
tmp = null;
}
else if (returnEmpty)
{
this.tokens = str.Split(this.delims.ToCharArray(), StringSplitOptions.None);
if (this.empty != String.Empty)
for(int i=0; i if (this.tokens[i] == String.Empty) this.tokens[i] = this.empty;
}
else
this.tokens = str.Split(this.delims.ToCharArray(), StringSplitOptions.RemoveEmptyEntries);
}
#endregion
#region [Properties covering Java methods]
///
/// Tests if there are more tokens available from this tokenizer's string.
/// If this method returns true , then a subsequent
/// use of the property will successfully return a token.
///
///
/// true if more tokens are available; otherwise false .
///
public bool HasMoreTokens
{
get { return this.index < this.tokens.Length; }
}
///
/// Gets the next token.
///
/// The next token.
/// Thrown when trying to get a token which doesn't exist.
/// Usually caused by not checking if the property returns true before trying to get the next token.
public string NextToken
{
get { return this.tokens[index++]; }
}
///
/// Counts the tokens - the number of times the
/// property can be used before it throws an exception.
///
/// The number of remaining tokens.
///
public int CountTokens
{
get { return this.tokens.Length - this.index; }
}
#endregion
#region [New methods/properties]
///
/// Gets the total number of tokens extracted.
///
///
///
/// This property returns the total number of extracted tokens,
/// contrary to .
///
/// The number of tokens extracted.
///
public int Count
{
get { return this.tokens.Length; }
}
///
/// Gets the token with the specified index from the tokenizer without moving the current position index.
///
///
/// The index of the token to get.
/// The token with the given index
/// Thrown when trying to get a token which doesn't exist, that is when is equal or greater then or is negative.
public string this[int index]
{
get { return this.tokens[index]; }
}
///
/// Resets the current position index so that the tokens can be extracted again.
///
///
public void Reset()
{
this.index = 0;
}
///
/// Gets the currently set string for empty tokens.
///
/// Default is System.String.Empty
/// The empty token string.
public string EmptyString
{
get { return this.empty; }
}
#endregion
#region [Java-compilant methods]
/*
///
/// Tests if there are more tokens available from this tokenizer's string.
/// If this method returns true , then a subsequent call to will successfully return a token.
///
///
/// true if and only if there is at least one token in the string after the current position; otherwise false .
///
///
public bool hasMoreTokens()
{
return HasMoreTokens;
}
///
/// Returns the next token from this string tokenizer.
///
/// The next token from this string tokenizer.
public string nextToken()
{
return NextToken;
}
///
/// Calculates the number of times that this tokenizer's method can be called before it generates an exception. The current position is not advanced.
///
/// The number of tokens remaining in the string using the current delimiter set.
public int countTokens()
{
return CountTokens;
}
*/
#endregion
#region [IEnumerable implementation]
///
/// Returns an enumerator that iterates through the collection.
///
///
/// A that can be used to iterate through the collection.
///
public IEnumerator GetEnumerator()
{
while (this.HasMoreTokens)
yield return this.NextToken;
}
System.Collections.IEnumerator System.Collections.IEnumerable.GetEnumerator()
{
return GetEnumerator();
}
#endregion
}
}