Cursor, Winista.Text.HtmlParser.Lex C# (CSharp) 코드 예제들

예제 #1

0

파일 보기

파일: TagNode.cs 프로젝트: JamalAbuDayyeh/slowandsteadyparser

		/// <summary> Print the contents of the tag.</summary>
		/// <remarks>
		/// The result has the form <c>Tag (start,end): text</c>, or
		/// <c>End (start,end): text</c> when <c>IsEndTag()</c> is true, where
		/// <c>start</c> and <c>end</c> are the string forms of cursors built from
		/// <c>StartPosition</c> and <c>EndPosition</c>. When the full line would
		/// be longer than 80 characters the tag text is cut short and "..." is
		/// appended.
		/// </remarks>
		/// <returns> A string describing the tag. For text that looks like HTML use #toHtml().
		/// </returns>
		public override System.String ToString()
		{
			System.String text;
			System.String type;
			Cursor start;
			Cursor end;
			System.Text.StringBuilder ret;
			
			text = GetText();
			ret = new System.Text.StringBuilder(20 + text.Length);
			type = IsEndTag() ? "End" : "Tag";
			start = new Cursor(Page, StartPosition);
			end = new Cursor(Page, EndPosition);
			ret.Append(type);
			ret.Append(" (");
			ret.Append(start);
			ret.Append(",");
			ret.Append(end);
			ret.Append("): ");
			if (80 < ret.Length + text.Length)
			{
				// Leave room for the three-character ellipsis. The prefix alone
				// may already be past column 77, in which case no tag text is
				// kept; without the clamp the length would be negative and the
				// copy would throw ArgumentOutOfRangeException.
				int keep = System.Math.Max(0, 77 - ret.Length);
				ret.Append(text, 0, keep);
				ret.Append("...");
			}
			else
				ret.Append(text);
			
			return (ret.ToString());
		}

예제 #2

0

파일 보기

파일: Lexer.cs 프로젝트: JamalAbuDayyeh/slowandsteadyparser

		/// <summary> Rewind the lexer so that parsing starts over.
		/// The page is reset and the cursor is replaced by a fresh one at
		/// offset zero, so that the next call to <code>nextNode()</code>
		/// returns the first lexeme on the page.
		/// </summary>
		public virtual void Reset()
		{
			const int startOfPage = 0;
			
			this.Page.Reset();
			this.Cursor = new Cursor(this.Page, startOfPage);
		}

예제 #3

0

파일 보기

파일: PageIndex.cs 프로젝트: JamalAbuDayyeh/slowandsteadyparser

		/// <summary> Fetch the object at the given index.</summary>
		/// <param name="index">The item number to get; used directly as an
		/// index into the stored offsets.
		/// </param>
		/// <param name="reuse">If this argument is not null, it is an object
		/// acquired from a previous fetch that is no longer needed. It is cast
		/// to a <c>Cursor</c>, overwritten with the requested position and this
		/// index's page, and returned instead of allocating a new cursor.
		/// </param>
		/// <returns> The Ordered object at that index: the recycled
		/// <paramref name="reuse"/> object when one was supplied, otherwise a
		/// newly created cursor.
		/// </returns>
		public virtual IOrdered Fetch(int index, IOrdered reuse)
		{
			// Nothing to recycle: hand back a brand new cursor.
			if (null == reuse)
				return (new Cursor(Page, mIndices[index]));
			
			// Recycle the caller's discarded cursor in place.
			Cursor recycled = (Cursor) reuse;
			recycled.mPosition = mIndices[index];
			recycled.mPage = Page; // redundant
			
			return (recycled);
		}

예제 #4

0

파일 보기

파일: PageIndex.cs 프로젝트: JamalAbuDayyeh/slowandsteadyparser

		/// <summary> Add an element to the list, keeping offsets unique.</summary>
		/// <param name="cursor">The element to add; its <c>Position</c> is the
		/// value that gets stored.
		/// </param>
		/// <returns> The position at which the element was inserted or
		/// the index of the existing element if it is a duplicate.
		/// </returns>
		public virtual int Add(Cursor cursor)
		{
			int offset = cursor.Position;
			
			// Empty list: the new offset becomes element zero.
			if (0 == mCount)
			{
				InsertElementAt(offset, 0);
				return (0);
			}
			
			// Compare against the final stored offset first, so that a repeat
			// of it, or anything beyond it, is handled without a search.
			int tail = mIndices[mCount - 1];
			if (offset == tail)
				return (mCount - 1);
			if (offset > tail)
			{
				int appendedAt = mCount;
				InsertElementAt(offset, appendedAt);
				return (appendedAt);
			}
			
			// Somewhere before the tail: find where it goes ...
			int slot = SortImpl.Bsearch(this, cursor);
			
			// ... and insert, but not twice.
			bool alreadyPresent = (slot < Size()) && (offset == mIndices[slot]);
			if (!alreadyPresent)
				InsertElementAt(offset, slot);
			
			return (slot);
		}

예제 #5

0

파일 보기

파일: PageIndex.cs 프로젝트: JamalAbuDayyeh/slowandsteadyparser

		/// <summary> Get the line number for a cursor.</summary>
		/// <param name="cursor">The character offset into the page.
		/// </param>
		/// <returns> The line number the character is in.
		/// </returns>
		public virtual int Row(Cursor cursor)
		{
			int line = SortImpl.Bsearch(this, cursor);
			
			// The search yields the index of a stored line-end offset when the
			// cursor matches one exactly. Such an offset is really the first
			// character of the following line, so step forward one line.
			bool atLineStart = (line < mCount) && (cursor.Position == mIndices[line]);
			
			return (atLineStart ? line + 1 : line);
		}

예제 #6

0

파일 보기

파일: PageIndex.cs 프로젝트: JamalAbuDayyeh/slowandsteadyparser

		/// <summary> Get the column number for a cursor.</summary>
		/// <param name="cursor">The character offset into the page.
		/// </param>
		/// <returns> The character offset into the line this cursor is on,
		/// computed as the cursor position minus the stored offset preceding
		/// its row (or minus zero on the first row).
		/// </returns>
		public virtual int Column(Cursor cursor)
		{
			int line = Row(cursor);
			
			// The first line starts at offset zero; every other line starts at
			// the offset stored for the row before it.
			int lineStart = (0 == line) ? 0 : this.ElementAt(line - 1);
			
			return (cursor.Position - lineStart);
		}

예제 #7

0

파일 보기

파일: TextNode.cs 프로젝트: JamalAbuDayyeh/slowandsteadyparser

		/// <summary> Express this string node as a printable string
		/// This is suitable for display in a debugger or output to a printout.
		/// Tab, line feed and carriage return characters are replaced by their
		/// escape sequences, and the output is cut off with "..." once it
		/// reaches 77 characters.
		/// </summary>
		/// <remarks>
		/// When the node has no cached text the characters are read from the
		/// page between the start and end positions and the header shows both
		/// positions as cursors; otherwise the cached text is used and the
		/// header shows the raw integer positions.
		/// </remarks>
		/// <returns> A string representation of the string node.
		/// </returns>
		public override System.String ToString()
		{
			int startpos;
			int endpos;
			Cursor start;
			Cursor end;
			System.Text.StringBuilder ret;
			
			startpos = StartPosition;
			endpos = EndPosition;
			ret = new System.Text.StringBuilder(endpos - startpos + 20);
			if (null == mText)
			{
				start = new Cursor(Page, startpos);
				end = new Cursor(Page, endpos);
				ret.Append("Txt (");
				ret.Append(start);
				ret.Append(",");
				ret.Append(end);
				ret.Append("): ");
				while (start.Position < endpos)
				{
					try
					{
						AppendEscaped(ret, mPage.GetCharacter(start));
					}
					catch (ParserException)
					{
						// Not really expected, but we're only doing ToString, so
						// don't propagate. Stop reading rather than retrying:
						// NOTE(review): a failed read presumably leaves the cursor
						// where it was, which would make this loop spin forever.
						break;
					}
					if (77 <= ret.Length)
					{
						ret.Append("...");
						break;
					}
				}
			}
			else
			{
				ret.Append("Txt (");
				ret.Append(startpos);
				ret.Append(",");
				ret.Append(endpos);
				ret.Append("): ");
				for (int i = 0; i < mText.Length; i++)
				{
					AppendEscaped(ret, mText[i]);
					if (77 <= ret.Length)
					{
						ret.Append("...");
						break;
					}
				}
			}
			
			return (ret.ToString());
		}
		
		/// <summary> Append one character to the buffer, writing tab, line feed
		/// and carriage return as the two-character sequences \t, \n and \r.
		/// </summary>
		/// <param name="buffer">The buffer to append to.
		/// </param>
		/// <param name="c">The character to append.
		/// </param>
		private static void AppendEscaped(System.Text.StringBuilder buffer, char c)
		{
			switch (c)
			{
				case '\t': 
					buffer.Append("\\t");
					break;
				
				case '\n': 
					buffer.Append("\\n");
					break;
				
				case '\r': 
					buffer.Append("\\r");
					break;
				
				default: 
					buffer.Append(c);
					break;
			}
		}

예제 #8

0

파일 보기

파일: ScriptDecoder.cs 프로젝트: JamalAbuDayyeh/slowandsteadyparser

		/// <summary> Decode script encoded by the Microsoft obfuscator.</summary>
		/// <remarks>
		/// Characters are read one at a time from the page and fed through a
		/// state machine: match the leader, read a six-character encoded
		/// length, match the prefix, decode that many input characters
		/// (handling '@' escapes) while summing a checksum, read and verify a
		/// six-character encoded checksum, then match the trailer. Text seen
		/// before a leader is copied to the output unchanged.
		/// </remarks>
		/// <param name="page">The source for encoded text.
		/// </param>
		/// <param name="cursor">The position at which to start decoding.
		/// This is advanced to the end of the encoded text.
		/// </param>
		/// <returns> The plaintext.
		/// </returns>
		/// <exception cref="ParserException">If an error is discovered while decoding:
		/// end of input in the middle of an encoded block, a negative length,
		/// an unexpected prefix, trailer or escape character, an encoded
		/// control character, or a checksum mismatch.
		/// </exception>
		public static System.String Decode(Page page, Cursor cursor)
		{
			int state;
			int substate_initial;
			int substate_length;
			int substate_prefix;
			int substate_checksum;
			int substate_final;
			long checksum;
			long length;
			char[] buffer;
			buffer = new char[6];
			int index;
			char character;
			int input_character;
			bool found;
			System.Text.StringBuilder ret;
			
			ret = new System.Text.StringBuilder(1024);
			
			state = STATE_INITIAL;
			substate_initial = 0;
			substate_length = 0;
			substate_prefix = 0;
			substate_checksum = 0;
			substate_final = 0;
			length = 0L;
			checksum = 0L;
			index = 0;
			while (STATE_DONE != state)
			{
				input_character = page.GetCharacter(cursor);
				character = (char) input_character;
				if (Page.EOF == input_character)
				{
					// End of input is only legal between encoded blocks, with
					// no partially matched marker pending.
					if ((STATE_INITIAL != state) || (0 != substate_initial) || (0 != substate_length) || (0 != substate_prefix) || (0 != substate_checksum) || (0 != substate_final))
						throw new ParserException("illegal state for exit");
					state = STATE_DONE;
				}
				else
					switch (state)
					{
						
						case STATE_INITIAL: 
							if (character == mLeader[substate_initial])
							{
								substate_initial++;
								if (substate_initial == mLeader.Length)
								{
									substate_initial = 0;
									state = STATE_LENGTH;
								}
							}
							else
							{
								// oops, flush: the partially matched leader was
								// ordinary text after all, so emit exactly the
								// characters matched so far, in order, followed
								// by the character that broke the match.
								for (int k = 0; k < substate_initial; k++)
									ret.Append(mLeader[k]);
								substate_initial = 0;
								ret.Append(character);
							}
							break;
						
						
						case STATE_LENGTH: 
							// Collect a full buffer of characters, then decode
							// them into the payload length.
							buffer[substate_length] = character;
							substate_length++;
							if (substate_length >= buffer.Length)
							{
								length = DecodeBase64(buffer);
								if (0 > length)
									throw new ParserException("illegal length: " + length);
								substate_length = 0;
								state = STATE_PREFIX;
							}
							break;
						
						
						case STATE_PREFIX: 
							if (character == mPrefix[substate_prefix])
								substate_prefix++;
							else
								throw new ParserException("illegal character encountered: " + (int) character + " ('" + character + "')");
							if (substate_prefix >= mPrefix.Length)
							{
								substate_prefix = 0;
								state = STATE_DECODE;
							}
							break;
						
						
						case STATE_DECODE: 
							if ('@' == character)
								state = STATE_ESCAPE;
							else
							{
								if (input_character < 0x80)
								{
									// Map the input onto a lookup table column:
									// tab uses column 0, printable characters
									// start at column 1.
									if (input_character == '\t')
										input_character = 0;
									else if (input_character >= ' ')
										input_character -= (' ' - 1);
									else
										throw new ParserException("illegal encoded character: " + input_character + " ('" + character + "')");
									char ch = mLookupTable[mEncodingIndex[index % 64]][input_character];
									ret.Append(ch);
									checksum += ch;
									index++;
								}
								else
									// Characters at or above 0x80 pass through
									// untranslated and are not checksummed.
									ret.Append(character);
							}
							// Every input character, including '@', counts
							// against the declared length.
							length--;
							if (0 == length)
							{
								index = 0;
								state = STATE_CHECKSUM;
							}
							break;
						
						
						case STATE_ESCAPE: 
							found = false;
							for (int i = 0; i < mEscapes.Length; i++)
								if (character == mEscapes[i])
								{
									found = true;
									character = mEscaped[i];
									// Stop at the first match so the translated
									// character is not compared against the
									// remaining escape codes.
									break;
								}
							if (!found)
								throw new ParserException("unexpected escape character: " + (int) character + " ('" + character + "')");
							ret.Append(character);
							checksum += character;
							index++;
							state = STATE_DECODE;
							length--;
							if (0 == length)
							{
								index = 0;
								state = STATE_CHECKSUM;
							}
							break;
						
						
						case STATE_CHECKSUM: 
							// Collect a full buffer of characters, then compare
							// the decoded value with the running checksum.
							buffer[substate_checksum] = character;
							substate_checksum++;
							if (substate_checksum >= buffer.Length)
							{
								long check = DecodeBase64(buffer);
								if (check != checksum)
									throw new ParserException("incorrect checksum, expected " + check + ", calculated " + checksum);
								checksum = 0;
								substate_checksum = 0;
								state = STATE_FINAL;
							}
							break;
						
						
						case STATE_FINAL: 
							if (character == mTrailer[substate_final])
								substate_final++;
							else
								throw new ParserException("illegal character encountered: " + (int) character + " ('" + character + "')");
							if (substate_final >= mTrailer.Length)
							{
								substate_final = 0;
								// LAST_STATE is defined outside this method; it
								// selects the state entered after a complete block.
								state = LAST_STATE;
							}
							break;
						
						default: 
							throw new ParserException("invalid state: " + state);
						
					}
			}
			
			return (ret.ToString());
		}

예제 #9

0

파일 보기