259 lines
9.2 KiB
C#
259 lines
9.2 KiB
C#
#region PDFsharp - A .NET library for processing PDF
|
|
//
|
|
// Authors:
|
|
// Microsoft
|
|
//
|
|
// Copyright (c) 2005-2017 empira Software GmbH, Cologne Area (Germany)
|
|
//
|
|
// http://www.pdfsharp.com
|
|
// http://sourceforge.net/projects/pdfsharp
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a
|
|
// copy of this software and associated documentation files (the "Software"),
|
|
// to deal in the Software without restriction, including without limitation
|
|
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
// and/or sell copies of the Software, and to permit persons to whom the
|
|
// Software is furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included
|
|
// in all copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
// THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
// DEALINGS IN THE SOFTWARE.
|
|
#endregion
|
|
|
|
using System;
|
|
using System.Globalization;
|
|
|
|
#if !EDF_CORE
|
|
namespace PdfSharp.Internal
|
|
#else
|
|
namespace Edf.Internal
|
|
#endif
|
|
{
|
|
// Reflected from WPF to ensure compatibility
|
|
// Use netmassdownloader -d "C:\Program Files (x86)\Reference Assemblies\Microsoft\Framework\v3.0" -output g:\cachetest -v
|
|
class TokenizerHelper
|
|
{
|
|
/// <summary>
|
|
/// Initializes a new instance of the <see cref="TokenizerHelper"/> class.
|
|
/// </summary>
|
|
public TokenizerHelper(string str, IFormatProvider formatProvider)
|
|
{
|
|
char numericListSeparator = GetNumericListSeparator(formatProvider);
|
|
Initialize(str, '\'', numericListSeparator);
|
|
}
|
|
|
|
/// <summary>
|
|
/// Initializes a new instance of the <see cref="TokenizerHelper"/> class.
|
|
/// </summary>
|
|
public TokenizerHelper(string str, char quoteChar, char separator)
|
|
{
|
|
Initialize(str, quoteChar, separator);
|
|
}
|
|
|
|
void Initialize(string str, char quoteChar, char separator)
|
|
{
|
|
_str = str;
|
|
_strLen = str == null ? 0 : str.Length;
|
|
_currentTokenIndex = -1;
|
|
_quoteChar = quoteChar;
|
|
_argSeparator = separator;
|
|
|
|
// Skip any whitespace.
|
|
while (_charIndex < _strLen)
|
|
{
|
|
if (!char.IsWhiteSpace(_str, _charIndex))
|
|
return;
|
|
_charIndex++;
|
|
}
|
|
}
|
|
|
|
public string NextTokenRequired()
|
|
{
|
|
if (!NextToken(false))
|
|
throw new InvalidOperationException("PrematureStringTermination"); //SR.Get(SRID.TokenizerHelperPrematureStringTermination, new object[0]));
|
|
return GetCurrentToken();
|
|
}
|
|
|
|
public string NextTokenRequired(bool allowQuotedToken)
|
|
{
|
|
if (!NextToken(allowQuotedToken))
|
|
throw new InvalidOperationException("PrematureStringTermination"); //SR.Get(SRID.TokenizerHelperPrematureStringTermination, new object[0]));
|
|
return GetCurrentToken();
|
|
}
|
|
|
|
public string GetCurrentToken()
|
|
{
|
|
if (_currentTokenIndex < 0)
|
|
return null;
|
|
return _str.Substring(_currentTokenIndex, _currentTokenLength);
|
|
}
|
|
|
|
public void LastTokenRequired()
|
|
{
|
|
if (_charIndex != _strLen)
|
|
throw new InvalidOperationException("Extra data encountered"); //SR.Get(SRID.TokenizerHelperExtraDataEncountered, new object[0]));
|
|
}
|
|
|
|
/// <summary>
|
|
/// Move to next token.
|
|
/// </summary>
|
|
public bool NextToken()
|
|
{
|
|
return NextToken(false);
|
|
}
|
|
|
|
/// <summary>
|
|
/// Move to next token.
|
|
/// </summary>
|
|
public bool NextToken(bool allowQuotedToken)
|
|
{
|
|
return NextToken(allowQuotedToken, _argSeparator);
|
|
}
|
|
|
|
public bool NextToken(bool allowQuotedToken, char separator)
|
|
{
|
|
// Reset index.
|
|
_currentTokenIndex = -1;
|
|
_foundSeparator = false;
|
|
|
|
// Already at the end of the string?
|
|
if (_charIndex >= _strLen)
|
|
return false;
|
|
|
|
char currentChar = _str[_charIndex];
|
|
|
|
// Setup the quoteCount .
|
|
int quoteCount = 0;
|
|
|
|
// If we are allowing a quoted token and this token begins with a quote,
|
|
// set up the quote count and skip the initial quote
|
|
if (allowQuotedToken &&
|
|
currentChar == _quoteChar)
|
|
{
|
|
quoteCount++;
|
|
_charIndex++;
|
|
}
|
|
|
|
int newTokenIndex = _charIndex;
|
|
int newTokenLength = 0;
|
|
|
|
// Loop until hit end of string or hit a separator or whitespace.
|
|
while (_charIndex < _strLen)
|
|
{
|
|
currentChar = _str[_charIndex];
|
|
|
|
// If have a quoteCount and this is a quote decrement the quoteCount.
|
|
if (quoteCount > 0)
|
|
{
|
|
// If anything but a quoteChar we move on.
|
|
if (currentChar == _quoteChar)
|
|
{
|
|
quoteCount--;
|
|
|
|
// If at zero which it always should for now break out of the loop.
|
|
if (quoteCount == 0)
|
|
{
|
|
++_charIndex;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
else if ((char.IsWhiteSpace(currentChar)) || (currentChar == separator))
|
|
{
|
|
if (currentChar == separator)
|
|
_foundSeparator = true;
|
|
break;
|
|
}
|
|
|
|
_charIndex++;
|
|
newTokenLength++;
|
|
}
|
|
|
|
// If quoteCount isn't zero we hit the end of the string before the ending quote.
|
|
if (quoteCount > 0)
|
|
throw new InvalidOperationException("Missing end quote"); //SR.Get(SRID.TokenizerHelperMissingEndQuote, new object[0]));
|
|
|
|
// Move at the start of the nextToken.
|
|
ScanToNextToken(separator);
|
|
|
|
// Update the _currentToken values.
|
|
_currentTokenIndex = newTokenIndex;
|
|
_currentTokenLength = newTokenLength;
|
|
|
|
if (_currentTokenLength < 1)
|
|
throw new InvalidOperationException("Empty token"); // SR.Get(SRID.TokenizerHelperEmptyToken, new object[0]));
|
|
|
|
return true;
|
|
}
|
|
|
|
private void ScanToNextToken(char separator)
|
|
{
|
|
// Do nothing if already at end of the string.
|
|
if (_charIndex < _strLen)
|
|
{
|
|
char currentChar = _str[_charIndex];
|
|
|
|
// Ensure that currentChar is a white space or separator.
|
|
if (currentChar != separator && !char.IsWhiteSpace(currentChar))
|
|
throw new InvalidOperationException("ExtraDataEncountered"); //SR.Get(SRID.TokenizerHelperExtraDataEncountered, new object[0]));
|
|
|
|
// Loop until a character that isn't the separator or white space.
|
|
int argSepCount = 0;
|
|
while (_charIndex < _strLen)
|
|
{
|
|
currentChar = _str[_charIndex];
|
|
if (currentChar == separator)
|
|
{
|
|
_foundSeparator = true;
|
|
argSepCount++;
|
|
_charIndex++;
|
|
|
|
if (argSepCount > 1)
|
|
throw new InvalidOperationException("EmptyToken"); //SR.Get(SRID.TokenizerHelperEmptyToken, new object[0]));
|
|
}
|
|
else if (char.IsWhiteSpace(currentChar))
|
|
{
|
|
// Skip white space.
|
|
++_charIndex;
|
|
}
|
|
else
|
|
break;
|
|
}
|
|
|
|
// If there was a separatorChar then we shouldn't be at the end of string or means there was a separator but there isn't an arg.
|
|
if (argSepCount > 0 && _charIndex >= _strLen)
|
|
throw new InvalidOperationException("EmptyToken"); // SR.Get(SRID.TokenizerHelperEmptyToken, new object[0]));
|
|
}
|
|
}
|
|
|
|
public static char GetNumericListSeparator(IFormatProvider provider)
|
|
{
|
|
char numericSeparator = ',';
|
|
NumberFormatInfo numberFormat = NumberFormatInfo.GetInstance(provider);
|
|
if (numberFormat.NumberDecimalSeparator.Length > 0 && numericSeparator == numberFormat.NumberDecimalSeparator[0])
|
|
numericSeparator = ';';
|
|
return numericSeparator;
|
|
}
|
|
|
|
public bool FoundSeparator
|
|
{
|
|
get { return _foundSeparator; }
|
|
}
|
|
bool _foundSeparator;
|
|
|
|
char _argSeparator;
|
|
int _charIndex;
|
|
int _currentTokenIndex;
|
|
int _currentTokenLength;
|
|
char _quoteChar;
|
|
string _str;
|
|
int _strLen;
|
|
}
|
|
} |