forked from mirrors/gecko-dev
		
	
		
			
				
	
	
		
			223 lines
		
	
	
	
		
			6.4 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			223 lines
		
	
	
	
		
			6.4 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /* This Source Code Form is subject to the terms of the Mozilla Public
 | |
|  * License, v. 2.0. If a copy of the MPL was not distributed with this
 | |
|  * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
 | |
| 
 | |
| #include "mozilla/dom/TextDecoder.h"
 | |
| #include "mozilla/dom/EncodingUtils.h"
 | |
| #include "nsContentUtils.h"
 | |
| #include "nsICharsetConverterManager.h"
 | |
| #include "nsServiceManagerUtils.h"
 | |
| 
 | |
| namespace mozilla {
 | |
| namespace dom {
 | |
| 
 | |
| static const PRUnichar kReplacementChar = static_cast<PRUnichar>(0xFFFD);
 | |
| 
 | |
| void
 | |
| TextDecoder::Init(const nsAString& aEncoding,
 | |
|                   const TextDecoderOptions& aFatal,
 | |
|                   ErrorResult& aRv)
 | |
| {
 | |
|   nsAutoString label(aEncoding);
 | |
|   EncodingUtils::TrimSpaceCharacters(label);
 | |
| 
 | |
|   // Let encoding be the result of getting an encoding from label.
 | |
|   // If encoding is failure, throw a TypeError.
 | |
|   if (!EncodingUtils::FindEncodingForLabel(label, mEncoding)) {
 | |
|     aRv.ThrowTypeError(MSG_ENCODING_NOT_SUPPORTED, &label);
 | |
|     return;
 | |
|   }
 | |
| 
 | |
|   mIsUTF16Family = mEncoding.EqualsLiteral("UTF-16LE") ||
 | |
|                    mEncoding.EqualsLiteral("UTF-16BE");
 | |
| 
 | |
|   // If the constructor is called with an options argument,
 | |
|   // and the fatal property of the dictionary is set,
 | |
|   // set the internal fatal flag of the decoder object.
 | |
|   mFatal = aFatal.fatal;
 | |
| 
 | |
|   // Create a decoder object for mEncoding.
 | |
|   nsCOMPtr<nsICharsetConverterManager> ccm =
 | |
|     do_GetService(NS_CHARSETCONVERTERMANAGER_CONTRACTID);
 | |
|   if (!ccm) {
 | |
|     aRv.Throw(NS_ERROR_UNEXPECTED);
 | |
|     return;
 | |
|   }
 | |
| 
 | |
|   ccm->GetUnicodeDecoderRaw(mEncoding.get(), getter_AddRefs(mDecoder));
 | |
|   if (!mDecoder) {
 | |
|     aRv.Throw(NS_ERROR_UNEXPECTED);
 | |
|     return;
 | |
|   }
 | |
| 
 | |
|   if (mFatal) {
 | |
|     mDecoder->SetInputErrorBehavior(nsIUnicodeDecoder::kOnError_Signal);
 | |
|   }
 | |
| }
 | |
| 
 | |
| void
 | |
| TextDecoder::ResetDecoder()
 | |
| {
 | |
|   mDecoder->Reset();
 | |
|   mOffset = 0;
 | |
| }
 | |
| 
 | |
| void
 | |
| TextDecoder::Decode(const ArrayBufferView* aView,
 | |
|                     const TextDecodeOptions& aOptions,
 | |
|                     nsAString& aOutDecodedString,
 | |
|                     ErrorResult& aRv)
 | |
| {
 | |
|   const char* data;
 | |
|   uint32_t length;
 | |
|   // If view is not specified, let view be a Uint8Array of length 0.
 | |
|   if (!aView) {
 | |
|     data = EmptyCString().BeginReading();
 | |
|     length = EmptyCString().Length();
 | |
|   } else {
 | |
|     data = reinterpret_cast<const char*>(aView->Data());
 | |
|     length = aView->Length();
 | |
|   }
 | |
| 
 | |
|   aOutDecodedString.Truncate();
 | |
|   if (mIsUTF16Family && mOffset < 2) {
 | |
|     HandleBOM(data, length, aOptions, aOutDecodedString, aRv);
 | |
|     if (aRv.Failed() || mOffset < 2) {
 | |
|       return;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   // Run or resume the decoder algorithm of the decoder object's encoder.
 | |
|   int32_t outLen;
 | |
|   nsresult rv = mDecoder->GetMaxLength(data, length, &outLen);
 | |
|   if (NS_FAILED(rv)) {
 | |
|     aRv.Throw(rv);
 | |
|     return;
 | |
|   }
 | |
|   // Need a fallible allocator because the caller may be a content
 | |
|   // and the content can specify the length of the string.
 | |
|   static const fallible_t fallible = fallible_t();
 | |
|   nsAutoArrayPtr<PRUnichar> buf(new (fallible) PRUnichar[outLen + 1]);
 | |
|   if (!buf) {
 | |
|     aRv.Throw(NS_ERROR_OUT_OF_MEMORY);
 | |
|     return;
 | |
|   }
 | |
| 
 | |
|   for (;;) {
 | |
|     int32_t srcLen = length;
 | |
|     int32_t dstLen = outLen;
 | |
|     rv = mDecoder->Convert(data, &srcLen, buf, &dstLen);
 | |
|     // Convert will convert the input partially even if the status
 | |
|     // indicates a failure.
 | |
|     buf[dstLen] = 0;
 | |
|     aOutDecodedString.Append(buf, dstLen);
 | |
|     if (mFatal || rv != NS_ERROR_ILLEGAL_INPUT) {
 | |
|       break;
 | |
|     }
 | |
|     // Emit a decode error manually because some decoders
 | |
|     // do not support kOnError_Recover (bug 638379)
 | |
|     if (srcLen == -1) {
 | |
|       ResetDecoder();
 | |
|     } else {
 | |
|       data += srcLen + 1;
 | |
|       length -= srcLen + 1;
 | |
|       aOutDecodedString.Append(kReplacementChar);
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   // If the internal streaming flag of the decoder object is not set,
 | |
|   // then reset the encoding algorithm state to the default values
 | |
|   if (!aOptions.stream) {
 | |
|     ResetDecoder();
 | |
|     if (rv == NS_OK_UDEC_MOREINPUT) {
 | |
|       if (mFatal) {
 | |
|         aRv.Throw(NS_ERROR_DOM_ENCODING_DECODE_ERR);
 | |
|       } else {
 | |
|         // Need to emit a decode error manually
 | |
|         // to simulate the EOF handling of the Encoding spec.
 | |
|         aOutDecodedString.Append(kReplacementChar);
 | |
|       }
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   if (NS_FAILED(rv)) {
 | |
|     aRv.Throw(NS_ERROR_DOM_ENCODING_DECODE_ERR);
 | |
|   }
 | |
| }
 | |
| 
 | |
| void
 | |
| TextDecoder::HandleBOM(const char*& aData, uint32_t& aLength,
 | |
|                        const TextDecodeOptions& aOptions,
 | |
|                        nsAString& aOutString, ErrorResult& aRv)
 | |
| {
 | |
|   if (aLength < 2u - mOffset) {
 | |
|     if (aOptions.stream) {
 | |
|       memcpy(mInitialBytes + mOffset, aData, aLength);
 | |
|       mOffset += aLength;
 | |
|     } else if (mFatal) {
 | |
|       aRv.Throw(NS_ERROR_DOM_ENCODING_DECODE_ERR);
 | |
|     } else {
 | |
|       aOutString.Append(kReplacementChar);
 | |
|     }
 | |
|     return;
 | |
|   }
 | |
| 
 | |
|   memcpy(mInitialBytes + mOffset, aData, 2 - mOffset);
 | |
|   // copied data will be fed later.
 | |
|   aData += 2 - mOffset;
 | |
|   aLength -= 2 - mOffset;
 | |
|   mOffset = 2;
 | |
| 
 | |
|   nsAutoCString encoding;
 | |
|   if (!EncodingUtils::IdentifyDataOffset(mInitialBytes, 2, encoding) ||
 | |
|       !encoding.Equals(mEncoding)) {
 | |
|     // If the stream doesn't start with BOM or the BOM doesn't match the
 | |
|     // encoding, feed a BOM to workaround decoder's bug (bug 634541).
 | |
|     FeedBytes(mEncoding.EqualsLiteral("UTF-16LE") ? "\xFF\xFE" : "\xFE\xFF");
 | |
|   }
 | |
|   FeedBytes(mInitialBytes, &aOutString);
 | |
| }
 | |
| 
 | |
| void
 | |
| TextDecoder::FeedBytes(const char* aBytes, nsAString* aOutString)
 | |
| {
 | |
|   PRUnichar buf[3];
 | |
|   int32_t srcLen = mOffset;
 | |
|   int32_t dstLen = mozilla::ArrayLength(buf);
 | |
|   DebugOnly<nsresult> rv =
 | |
|     mDecoder->Convert(aBytes, &srcLen, buf, &dstLen);
 | |
|   MOZ_ASSERT(NS_SUCCEEDED(rv));
 | |
|   MOZ_ASSERT(srcLen == mOffset);
 | |
|   if (aOutString) {
 | |
|     aOutString->Assign(buf, dstLen);
 | |
|   }
 | |
| }
 | |
| 
 | |
| void
 | |
| TextDecoder::GetEncoding(nsAString& aEncoding)
 | |
| {
 | |
|   // Our utf-16 converter does not comply with the Encoding Standard.
 | |
|   // As a result the utf-16le converter is used for the encoding label
 | |
|   // "utf-16".
 | |
|   // This workaround should not be exposed to the public API and so "utf-16"
 | |
|   // is returned by GetEncoding() if the internal encoding name is "utf-16le".
 | |
|   if (mEncoding.EqualsLiteral("UTF-16LE")) {
 | |
|     aEncoding.AssignLiteral("utf-16");
 | |
|     return;
 | |
|   }
 | |
| 
 | |
|   CopyASCIItoUTF16(mEncoding, aEncoding);
 | |
|   nsContentUtils::ASCIIToLower(aEncoding);
 | |
| }
 | |
| 
 | |
| NS_IMPL_CYCLE_COLLECTING_ADDREF(TextDecoder)
 | |
| NS_IMPL_CYCLE_COLLECTING_RELEASE(TextDecoder)
 | |
| 
 | |
| NS_INTERFACE_MAP_BEGIN_CYCLE_COLLECTION(TextDecoder)
 | |
|   NS_INTERFACE_MAP_ENTRY(nsISupports)
 | |
| NS_INTERFACE_MAP_END
 | |
| 
 | |
| NS_IMPL_CYCLE_COLLECTION_WRAPPERCACHE_1(TextDecoder, mGlobal)
 | |
| 
 | |
| } // dom
 | |
| } // mozilla
 | 
