| Classes in this File | Line Coverage | Branch Coverage | Complexity | ||||
| StringDecoder |
|
| 2.0;2 |
| 1 | /* | |
| 2 | * #%L | |
| 3 | * StringDecoder.java - mongodb-async-driver - Allanbank Consulting, Inc. | |
| 4 | * %% | |
| 5 | * Copyright (C) 2011 - 2014 Allanbank Consulting, Inc. | |
| 6 | * %% | |
| 7 | * Licensed under the Apache License, Version 2.0 (the "License"); | |
| 8 | * you may not use this file except in compliance with the License. | |
| 9 | * You may obtain a copy of the License at | |
| 10 | * | |
| 11 | * http://www.apache.org/licenses/LICENSE-2.0 | |
| 12 | * | |
| 13 | * Unless required by applicable law or agreed to in writing, software | |
| 14 | * distributed under the License is distributed on an "AS IS" BASIS, | |
| 15 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |
| 16 | * See the License for the specific language governing permissions and | |
| 17 | * limitations under the License. | |
| 18 | * #L% | |
| 19 | */ | |
| 20 | ||
| 21 | package com.allanbank.mongodb.bson.io; | |
| 22 | ||
| 23 | import java.io.EOFException; | |
| 24 | import java.io.StreamCorruptedException; | |
| 25 | import java.nio.charset.Charset; | |
| 26 | ||
| 27 | /** | |
| 28 | * StringDecoder provides a decoder for byte arrays into strings that uses a | |
| 29 | * trie data structure to cache recurring strings. | |
| 30 | * <p> | |
| 31 | * This class is <b>not</b> thread safe. | |
| 32 | * </p> | |
| 33 | * | |
| 34 | * @api.no This class is <b>NOT</b> part of the drivers API. This class may be | |
| 35 | * mutated in incompatible ways between any two releases of the driver. | |
| 36 | * @copyright 2013, Allanbank Consulting, Inc., All Rights Reserved | |
| 37 | */ | |
| 38 | public class StringDecoder { | |
| 39 | ||
| 40 | /** UTF-8 Character set for encoding strings. */ | |
| 41 | 1 | /* package */final static Charset UTF8 = Charset.forName("UTF-8"); |
| 42 | ||
| 43 | /** A builder for the ASCII strings. */ | |
| 44 | 3511 | private final StringBuilder myBuilder = new StringBuilder(64); |
| 45 | ||
| 46 | /** The cached decoded strings. */ | |
| 47 | private final StringDecoderCache myCache; | |
| 48 | ||
| 49 | /** | |
| 50 | * Creates a new StringDecoder. | |
| 51 | */ | |
| 52 | public StringDecoder() { | |
| 53 | 2 | this(new StringDecoderCache()); |
| 54 | 2 | } |
| 55 | ||
| 56 | /** | |
| 57 | * Creates a new StringDecoder. | |
| 58 | * | |
| 59 | * @param cache | |
| 60 | * The cache for the decoder. | |
| 61 | */ | |
| 62 | public StringDecoder(final StringDecoderCache cache) { | |
| 63 | 3511 | super(); |
| 64 | ||
| 65 | 3511 | myCache = cache; |
| 66 | 3511 | } |
| 67 | ||
| 68 | /** | |
| 69 | * Decode a string of a known length. The last byte should be a zero byte | |
| 70 | * and will not be included in the decoded string. | |
| 71 | * | |
| 72 | * @param source | |
| 73 | * The source of the bytes in the string. | |
| 74 | * @param offset | |
| 75 | * The offset of the first byte to decode. | |
| 76 | * @param length | |
| 77 | * The length of the string to decode with a terminal zero byte. | |
| 78 | * @return The decoded string. | |
| 79 | * @throws StreamCorruptedException | |
| 80 | * On the decoding of the string failing. | |
| 81 | * @throws EOFException | |
| 82 | * On the array not containing enough bytes to decoded. | |
| 83 | */ | |
| 84 | public String decode(final byte[] source, final int offset, final int length) | |
| 85 | throws StreamCorruptedException, EOFException { | |
| 86 | ||
| 87 | 71517 | String result = myCache.find(source, offset, length); |
| 88 | 71516 | if (result == null) { |
| 89 | 70580 | result = fastDecode(source, offset, length - 1); |
| 90 | } | |
| 91 | ||
| 92 | 71516 | myCache.used(result, source, offset, length); |
| 93 | ||
| 94 | 71516 | return result; |
| 95 | } | |
| 96 | ||
| 97 | /** | |
| 98 | * Returns the cache value. | |
| 99 | * | |
| 100 | * @return The cache value. | |
| 101 | * @deprecated The cache {@link StringDecoderCache} should be controlled | |
| 102 | * directly. This method will be removed after the 2.1.0 | |
| 103 | * release. | |
| 104 | */ | |
| 105 | @Deprecated | |
| 106 | public StringDecoderCache getCache() { | |
| 107 | 0 | return myCache; |
| 108 | } | |
| 109 | ||
| 110 | /** | |
| 111 | * Retrieves or caches the decoded string for the Trie. | |
| 112 | * | |
| 113 | * @param source | |
| 114 | * The source of the bytes in the string. | |
| 115 | * @param offset | |
| 116 | * The offset of the first byte to decode. | |
| 117 | * @param length | |
| 118 | * The length of the string to decode without a terminal zero | |
| 119 | * byte. | |
| 120 | * @return The value for the string. | |
| 121 | */ | |
| 122 | private String fastDecode(final byte[] source, final int offset, | |
| 123 | final int length) { | |
| 124 | // Try to decode as ASCII. | |
| 125 | 70579 | boolean isAscii = true; |
| 126 | 404625 | for (int i = 0; isAscii && (i < length); ++i) { |
| 127 | 334042 | final int b = (source[offset + i] & 0xFF); |
| 128 | 334043 | if (b < 0x80) { |
| 129 | 333977 | myBuilder.append((char) b); |
| 130 | } | |
| 131 | else { | |
| 132 | 67 | isAscii = false; |
| 133 | } | |
| 134 | } | |
| 135 | ||
| 136 | String result; | |
| 137 | 70580 | if (!isAscii) { |
| 138 | 67 | final int encodedLength = myBuilder.length(); |
| 139 | ||
| 140 | 67 | final String remaining = new String(source, offset + encodedLength, |
| 141 | length - encodedLength, UTF8); | |
| 142 | ||
| 143 | 67 | myBuilder.append(remaining); |
| 144 | } | |
| 145 | 70580 | result = myBuilder.toString(); |
| 146 | ||
| 147 | // Clear the string builder. | |
| 148 | 70580 | myBuilder.setLength(0); |
| 149 | ||
| 150 | 70580 | return result; |
| 151 | } | |
| 152 | } |