/// <summary>
/// Adds the transitions leading from <paramref name="start"/> to <paramref name="end"/>
/// for the code point range given by <paramref name="startCodePoint"/> and
/// <paramref name="endCodePoint"/>.
/// </summary>
/// <remarks>
/// Both code points are loaded into the reusable <c>startUTF8</c> / <c>endUTF8</c>
/// sequences (presumably their UTF-8 encodings; confirm against <c>UTF8Sequence.Set</c>)
/// and the work is then handed to <c>Build</c>, beginning at byte index 0.
/// </remarks>
/// <param name="start">State the new transitions leave from.</param>
/// <param name="end">State the new transitions finally arrive at.</param>
/// <param name="startCodePoint">Code point passed to <c>startUTF8.Set</c>.</param>
/// <param name="endCodePoint">Code point passed to <c>endUTF8.Set</c>.</param>
internal void ConvertOneEdge(State start, State end, int startCodePoint, int endCodePoint)
{
    // Refresh the two shared scratch sequences with the range boundaries.
    startUTF8.Set(startCodePoint);
    endUTF8.Set(endCodePoint);

    // Build the byte-level transitions, starting from the first byte.
    Build(start, end, startUTF8, endUTF8, upto: 0);
}
/// <summary>
/// Adds the transitions that connect <paramref name="start"/> to <paramref name="end"/>
/// for the byte sequences running from <paramref name="startUTF8"/> to
/// <paramref name="endUTF8"/>, examining the byte at index <paramref name="upto"/>
/// and delegating or recursing for the bytes that follow it.
/// </summary>
/// <remarks>
/// The range is broken into a start part, an optional middle part and an end part:
/// <list type="bullet">
/// <item><description>Same byte at <paramref name="upto"/> in both sequences: emit a single
/// edge and recurse on the next byte (or finish if this is the last byte of both).</description></item>
/// <item><description>Different byte, same sequence length: <c>Start</c>, an optional
/// <c>All</c> for the bytes strictly in between, then <c>End</c>.</description></item>
/// <item><description>Different sequence lengths: <c>Start</c>, one <c>All</c> per intermediate
/// byte count, then <c>End</c>.</description></item>
/// </list>
/// </remarks>
/// <param name="start">State the transitions for this byte leave from.</param>
/// <param name="end">Final state reached once all bytes are consumed.</param>
/// <param name="startUTF8">Byte sequence at the low end of the range.</param>
/// <param name="endUTF8">Byte sequence at the high end of the range.</param>
/// <param name="upto">Index of the byte currently being processed.</param>
private void Build(State start, State end, UTF8Sequence startUTF8, UTF8Sequence endUTF8, int upto)
{
    var firstByte = startUTF8.ByteAt(upto);
    var lastByte = endUTF8.ByteAt(upto);
    bool atLastStartByte = upto == startUTF8.len - 1;

    // Degenerate case: both sequences lead with the same byte.
    if (firstByte == lastByte)
    {
        if (atLastStartByte && upto == endUTF8.len - 1)
        {
            // Super degenerate: one UTF-8 byte left in both, so a single edge suffices.
            start.AddTransition(new Transition(firstByte, lastByte, end));
            return;
        }

        if (Debugging.AssertsEnabled)
        {
            Debugging.Assert(startUTF8.len > upto + 1);
            Debugging.Assert(endUTF8.len > upto + 1);
        }

        State next = NewUTF8State();

        // Single-value leading edge (type=single), then recurse for the remaining bytes.
        start.AddTransition(new Transition(firstByte, next));
        Build(next, end, startUTF8, endUTF8, upto + 1);
        return;
    }

    // The sequences differ in length: start, possibly a middle spanning
    // several byte counts, then end.
    if (startUTF8.len != endUTF8.len)
    {
        Start(start, end, startUTF8, upto, true);

        int firstByteCount = 1 + startUTF8.len - upto;
        int limit = endUTF8.len - upto;
        for (int byteCount = firstByteCount; byteCount < limit; byteCount++)
        {
            // Wasteful: only the first byte is needed here, and it could be
            // statically encoded instead of recomputed.
            tmpUTF8a.Set(startCodes[byteCount - 1]);
            tmpUTF8b.Set(endCodes[byteCount - 1]);
            All(start, end, tmpUTF8a.ByteAt(0), tmpUTF8b.ByteAt(0), tmpUTF8a.len - 1);
        }

        End(start, end, endUTF8, upto, true);
        return;
    }

    // From here on both sequences have the same length but differ at this byte.
    if (atLastStartByte)
    {
        // Last byte of both: one ranged edge covers it (type=startend).
        start.AddTransition(new Transition(firstByte, lastByte, end));
        return;
    }

    Start(start, end, startUTF8, upto, false);

    if (lastByte - firstByte > 1)
    {
        // There is a middle: lead bytes strictly between the two boundaries.
        All(start, end, firstByte + 1, lastByte - 1, startUTF8.len - upto - 1);
    }

    End(start, end, endUTF8, upto, false);
}