C# (CSharp) Lucene.Net.Analysis.Standard StandardTokenizerImpl.GetNextToken示例

编程语言: C# (CSharp)

命名空间/包名称: Lucene.Net.Analysis.Standard

方法/功能: GetNextToken

hotexamples.com的示例: 4

C# (CSharp) Lucene.Net.Analysis.Standard StandardTokenizerImpl.GetNextToken - 已找到4个示例。这些是从开源项目中提取的最受好评的Lucene.Net.Analysis.Standard.StandardTokenizerImpl.GetNextToken现实C# (CSharp)示例。您可以评价示例，以帮助我们提高示例质量。

常用方法

显示隐藏

GetNextToken(3)

GetText(2)

Yychar(2)

Yylength(2)

GetStandardTokenizerImpl(1)

Reset(1)

Yyreset(1)

yychar(1)

yyclose(1)

yytext(1)

GetNextToken() public method

Resumes scanning until the next regular expression is matched, the end of input is encountered or an I/O-Error occurs.

Throws an exception if any I/O error occurs.

public GetNextToken ( ) : int
return	int

StandardTokenizerImpl Class Documentation

示例#1

显示文件

文件： StandardTokenizer.cs 项目： restran/lucene-file-finder

        /// <summary>
        /// Populates <paramref name="reusableToken"/> from the next scanner match whose
        /// length does not exceed <c>maxTokenLength</c>. Overrides the token-stream
        /// <c>Next</c> method.
        /// </summary>
        /// <param name="reusableToken">Token to fill in; asserted non-null in debug builds.</param>
        /// <returns>
        /// <paramref name="reusableToken"/> after it has been filled in, or <c>null</c>
        /// once the scanner reports <c>StandardTokenizerImpl.YYEOF</c>.
        /// </returns>
        public override Token Next(/* in */ Token reusableToken)
        {
            System.Diagnostics.Debug.Assert(reusableToken != null);

            // Starts at 1 and grows by one for every over-long term that gets skipped.
            int positionIncrement = 1;

            for (int kind = scanner.GetNextToken();
                 kind != StandardTokenizerImpl.YYEOF;
                 kind = scanner.GetNextToken())
            {
                if (scanner.Yylength() > maxTokenLength)
                {
                    // Too long: drop the term but still account for its position.
                    positionIncrement++;
                    continue;
                }

                reusableToken.Clear();
                reusableToken.SetPositionIncrement(positionIncrement);
                scanner.GetText(reusableToken);

                int startOffset = scanner.Yychar();
                reusableToken.SetStartOffset(startOffset);
                reusableToken.SetEndOffset(startOffset + reusableToken.TermLength());

                // The ACRONYM_DEP special case is slated for removal in the next release.
                // Until then an invalid acronym is either reported as HOST (with its
                // trailing '.' dropped) or as ACRONYM, depending on replaceInvalidAcronym.
                // Once removed, only the plain TOKEN_TYPES[kind] lookup should remain.
                int typeIndex = kind;
                bool dropTrailingDot = false;
                if (kind == StandardTokenizerImpl.ACRONYM_DEP)
                {
                    dropTrailingDot = replaceInvalidAcronym;
                    typeIndex = dropTrailingDot ? StandardTokenizerImpl.HOST : StandardTokenizerImpl.ACRONYM;
                }

                reusableToken.SetType(StandardTokenizerImpl.TOKEN_TYPES[typeIndex]);
                if (dropTrailingDot)
                {
                    // remove extra '.'
                    reusableToken.SetTermLength(reusableToken.TermLength() - 1);
                }

                return reusableToken;
            }

            return null;
        }

示例#2

显示文件

文件： StandardTokenizer.cs 项目： barsgroup/linux-packaging-mono

        /// <summary>
        /// Advances to the next scanner match whose length does not exceed
        /// <c>maxTokenLength</c> and copies its term, offsets, type and position
        /// increment into this stream's attributes.
        /// <see cref="Lucene.Net.Analysis.TokenStream.IncrementToken()" />
        /// </summary>
        /// <returns>
        /// <c>true</c> when the attributes were filled in for a token; <c>false</c> once
        /// the scanner reports <c>StandardTokenizerImpl.YYEOF</c>.
        /// </returns>
        public override bool IncrementToken()
        {
            ClearAttributes();

            // The loop header bumps the increment each time an over-long term is skipped.
            for (int positionIncrement = 1; ; positionIncrement++)
            {
                int kind = scanner.GetNextToken();
                if (kind == StandardTokenizerImpl.YYEOF)
                {
                    return false;
                }

                if (scanner.Yylength() > maxTokenLength)
                {
                    // Too long: skip the term; its position is still counted.
                    continue;
                }

                posIncrAtt.PositionIncrement = positionIncrement;
                scanner.GetText(termAtt);

                int rawStart = scanner.Yychar();
                int correctedStart = CorrectOffset(rawStart);
                int correctedEnd = CorrectOffset(rawStart + termAtt.TermLength());
                offsetAtt.SetOffset(correctedStart, correctedEnd);

                // The ACRONYM_DEP special case is slated for removal in the next release.
                // Until then an invalid acronym is either reported as HOST (with its
                // trailing '.' dropped) or as ACRONYM, depending on replaceInvalidAcronym.
                // Once removed, only the plain TOKEN_TYPES[kind] lookup should remain.
                if (kind != StandardTokenizerImpl.ACRONYM_DEP)
                {
                    typeAtt.Type = StandardTokenizerImpl.TOKEN_TYPES[kind];
                }
                else if (replaceInvalidAcronym)
                {
                    typeAtt.Type = StandardTokenizerImpl.TOKEN_TYPES[StandardTokenizerImpl.HOST];
                    // remove extra '.'
                    termAtt.SetTermLength(termAtt.TermLength() - 1);
                }
                else
                {
                    typeAtt.Type = StandardTokenizerImpl.TOKEN_TYPES[StandardTokenizerImpl.ACRONYM];
                }

                return true;
            }
        }

示例#3

显示文件

文件： BreakWords.cs 项目： zweib730/beagrep

  /// <summary>
  /// Pulls the next match from <paramref name="scanner"/> and wraps it in a new
  /// <c>Token</c> carrying the matched text, its start and end positions, and the
  /// type entry from <c>StandardTokenizerImpl.TOKEN_TYPES</c>.
  /// </summary>
  /// <param name="scanner">Scanner to read the next match from.</param>
  /// <returns>
  /// The new token, or <c>null</c> when the scanner reports
  /// <c>StandardTokenizerImpl.YYEOF</c>.
  /// </returns>
  public static Token Next(StandardTokenizerImpl scanner)
  {
    int kind = scanner.GetNextToken();

    if (kind != StandardTokenizerImpl.YYEOF) {
      int begin = scanner.yychar();
      string text = scanner.yytext();
      // End position is the start plus the length of the matched text.
      int end = begin + text.Length;
      return new Token(text, begin, end, StandardTokenizerImpl.TOKEN_TYPES[kind]);
    }

    return null;
  }

示例#4

显示文件

文件： StandardTokenizer.cs 项目： universsky/beagrep

        /// <summary>
        /// Returns the next token in the stream, or <c>null</c> when the scanner
        /// reports <c>StandardTokenizerImpl.YYEOF</c>.
        /// </summary>
        /// <remarks>
        /// The returned token's type is the <c>StandardTokenizerImpl.TOKEN_TYPES</c>
        /// entry for the token kind reported by the scanner.
        /// </remarks>
        /// <returns>A newly created token, or <c>null</c> at end of stream.</returns>
        public override Lucene.Net.Analysis.Token Next()
        {
            int kind = scanner.GetNextToken();
            if (kind == StandardTokenizerImpl.YYEOF)
            {
                return null;
            }

            int begin = scanner.yychar();
            string text = scanner.yytext();

            // End position is the start plus the length of the matched text.
            int end = begin + text.Length;

            return new Token(text, begin, end, StandardTokenizerImpl.TOKEN_TYPES[kind]);
        }