2021-09-04 08:06:49 +00:00
|
|
|
/*
 * Copyright (c) 2021 Huawei Device Co., Ltd.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
|
|
|
|
|
2021-09-07 14:24:16 +00:00
|
|
|
#ifndef ECMASCRIPT_STRING_INL_H
|
|
|
|
#define ECMASCRIPT_STRING_INL_H
|
2021-09-04 08:06:49 +00:00
|
|
|
|
|
|
|
#include "ecmascript/ecma_string.h"
|
2022-08-24 11:25:56 +00:00
|
|
|
#include "ecmascript/base/string_helper.h"
|
2021-09-04 08:06:49 +00:00
|
|
|
#include "ecmascript/ecma_vm.h"
|
|
|
|
#include "ecmascript/js_handle.h"
|
|
|
|
#include "ecmascript/js_tagged_value-inl.h"
|
2024-01-24 13:24:07 +00:00
|
|
|
#include "ecmascript/mem/heap.h"
|
|
|
|
#include "ecmascript/mem/space.h"
|
2022-04-28 12:17:41 +00:00
|
|
|
#include "ecmascript/object_factory-inl.h"
|
2021-09-04 08:06:49 +00:00
|
|
|
|
|
|
|
namespace panda::ecmascript {
|
|
|
|
/* static */
|
|
|
|
inline EcmaString *EcmaString::CreateEmptyString(const EcmaVM *vm)
|
|
|
|
{
|
2022-10-23 15:17:44 +00:00
|
|
|
auto string = vm->GetFactory()->AllocNonMovableLineStringObject(EcmaString::SIZE);
|
2022-08-24 11:25:56 +00:00
|
|
|
string->SetLength(0, true);
|
2022-01-14 13:50:26 +00:00
|
|
|
string->SetRawHashcode(0);
|
2021-09-04 08:06:49 +00:00
|
|
|
return string;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* static */
|
2022-08-24 11:25:56 +00:00
|
|
|
inline EcmaString *EcmaString::CreateFromUtf8(const EcmaVM *vm, const uint8_t *utf8Data, uint32_t utf8Len,
|
2023-05-08 09:07:03 +00:00
|
|
|
bool canBeCompress, MemSpaceType type, bool isConstantString,
|
|
|
|
uint32_t idOffset)
|
2021-09-04 08:06:49 +00:00
|
|
|
{
|
|
|
|
if (utf8Len == 0) {
|
|
|
|
return vm->GetFactory()->GetEmptyString().GetObject<EcmaString>();
|
|
|
|
}
|
|
|
|
EcmaString *string = nullptr;
|
2021-09-07 14:24:16 +00:00
|
|
|
if (canBeCompress) {
|
2023-05-08 09:07:03 +00:00
|
|
|
if (isConstantString) {
|
|
|
|
string = CreateConstantString(vm, utf8Data, utf8Len, canBeCompress, type, idOffset);
|
|
|
|
} else {
|
|
|
|
string = CreateLineStringWithSpaceType(vm, utf8Len, true, type);
|
|
|
|
ASSERT(string != nullptr);
|
2024-02-12 12:04:52 +00:00
|
|
|
std::copy(utf8Data, utf8Data + utf8Len, string->GetDataUtf8Writable());
|
2021-09-04 08:06:49 +00:00
|
|
|
}
|
|
|
|
} else {
|
2022-01-13 04:02:17 +00:00
|
|
|
auto utf16Len = base::utf_helper::Utf8ToUtf16Size(utf8Data, utf8Len);
|
2022-10-23 15:17:44 +00:00
|
|
|
string = CreateLineStringWithSpaceType(vm, utf16Len, false, type);
|
2021-09-04 08:06:49 +00:00
|
|
|
ASSERT(string != nullptr);
|
|
|
|
|
|
|
|
[[maybe_unused]] auto len =
|
2022-01-13 04:02:17 +00:00
|
|
|
base::utf_helper::ConvertRegionUtf8ToUtf16(utf8Data, string->GetDataUtf16Writable(), utf8Len, utf16Len, 0);
|
2021-09-04 08:06:49 +00:00
|
|
|
ASSERT(len == utf16Len);
|
|
|
|
}
|
|
|
|
|
2022-04-19 12:32:45 +00:00
|
|
|
ASSERT_PRINT(canBeCompress == CanBeCompressed(string), "Bad input canBeCompress!");
|
2021-09-04 08:06:49 +00:00
|
|
|
return string;
|
|
|
|
}
|
|
|
|
|
2024-02-12 12:04:52 +00:00
|
|
|
/* static */
|
|
|
|
inline EcmaString *EcmaString::CreateFromUtf8CompressedSubString(const EcmaVM *vm, const JSHandle<EcmaString> &string,
|
|
|
|
uint32_t offset, uint32_t utf8Len, MemSpaceType type)
|
|
|
|
{
|
2024-03-12 11:32:43 +00:00
|
|
|
if (UNLIKELY(utf8Len == 0)) {
|
2024-03-12 06:18:12 +00:00
|
|
|
return vm->GetFactory()->GetEmptyString().GetObject<EcmaString>();
|
|
|
|
}
|
2024-02-12 12:04:52 +00:00
|
|
|
EcmaString *subString = CreateLineStringWithSpaceType(vm, utf8Len, true, type);
|
|
|
|
ASSERT(subString != nullptr);
|
|
|
|
|
|
|
|
auto *utf8Data = string->GetDataUtf8() + offset;
|
|
|
|
std::copy(utf8Data, utf8Data + utf8Len, subString->GetDataUtf8Writable());
|
|
|
|
ASSERT_PRINT(CanBeCompressed(subString), "String cannot be compressed!");
|
|
|
|
return subString;
|
|
|
|
}
|
|
|
|
|
2023-11-23 08:32:20 +00:00
|
|
|
// Creates a UTF-16 line string of (at most) `utf16Len` code units by converting the MUTF-8 data at
// `utf8Data`; the input byte count is taken from utf::Mutf8Size(utf8Data).
// If the conversion produces fewer units than were allocated, the string is trimmed to the produced count.
// A zero `utf16Len` yields the factory's empty string.
inline EcmaString *EcmaString::CreateUtf16StringFromUtf8(const EcmaVM *vm, const uint8_t *utf8Data, uint32_t utf16Len,
                                                         MemSpaceType type)
{
    if (utf16Len == 0) {
        return vm->GetFactory()->GetEmptyString().GetObject<EcmaString>();
    }

    auto result = CreateLineStringWithSpaceType(vm, utf16Len, false, type);
    ASSERT(result != nullptr);

    uint16_t *out = result->GetDataUtf16Writable();
    auto produced = utf::ConvertRegionMUtf8ToUtf16(utf8Data, out, utf::Mutf8Size(utf8Data), utf16Len, 0);
    if (produced < utf16Len) {
        result->TrimLineString(vm->GetJSThread(), produced);
    }

    ASSERT_PRINT(false == CanBeCompressed(result), "Bad input canBeCompress!");
    return result;
}
|
|
|
|
|
|
|
|
inline void EcmaString::TrimLineString(const JSThread *thread, uint32_t newLength)
|
|
|
|
{
|
|
|
|
ASSERT(IsLineString());
|
|
|
|
ObjectFactory *factory = thread->GetEcmaVM()->GetFactory();
|
|
|
|
uint32_t oldLength = GetLength();
|
|
|
|
ASSERT(oldLength > newLength);
|
|
|
|
size_t trimBytes = (oldLength - newLength) * (IsUtf8() ? sizeof(uint8_t) : sizeof(uint16_t));
|
|
|
|
size_t size = IsUtf8() ? LineEcmaString::ComputeSizeUtf8(newLength) : LineEcmaString::ComputeSizeUtf16(newLength);
|
|
|
|
factory->FillFreeObject(ToUintPtr(this) + size, trimBytes, RemoveSlots::YES, ToUintPtr(this));
|
|
|
|
SetLength(newLength, CanBeCompressed(this));
|
|
|
|
}
|
|
|
|
|
2022-08-24 11:25:56 +00:00
|
|
|
// Creates a line string in `type` from `utf16Len` UTF-16 code units.
// With `canBeCompress` the units are narrowed into a compressed string via CopyChars; otherwise the
// raw 16-bit data is copied with memcpy_s (a failure there is fatal).
// A zero `utf16Len` yields the factory's empty string.
inline EcmaString *EcmaString::CreateFromUtf16(const EcmaVM *vm, const uint16_t *utf16Data, uint32_t utf16Len,
                                               bool canBeCompress, MemSpaceType type)
{
    if (utf16Len == 0) {
        return vm->GetFactory()->GetEmptyString().GetObject<EcmaString>();
    }

    auto result = CreateLineStringWithSpaceType(vm, utf16Len, canBeCompress, type);
    ASSERT(result != nullptr);

    if (!canBeCompress) {
        // Byte count of the UTF-16 payload; used both as destination capacity and copy size.
        uint32_t byteCount = utf16Len * (sizeof(uint16_t) / sizeof(uint8_t));
        if (memcpy_s(result->GetDataUtf16Writable(), byteCount, utf16Data, byteCount) != EOK) {
            LOG_FULL(FATAL) << "memcpy_s failed";
            UNREACHABLE();
        }
    } else {
        CopyChars(result->GetDataUtf8Writable(), utf16Data, utf16Len);
    }

    ASSERT_PRINT(canBeCompress == CanBeCompressed(result), "Bad input canBeCompress!");
    return result;
}
|
|
|
|
|
2022-10-23 15:17:44 +00:00
|
|
|
/* static */
|
|
|
|
inline EcmaString *EcmaString::CreateLineString(const EcmaVM *vm, size_t length, bool compressed)
|
2021-09-04 08:06:49 +00:00
|
|
|
{
|
2022-10-23 15:17:44 +00:00
|
|
|
size_t size = compressed ? LineEcmaString::ComputeSizeUtf8(length) : LineEcmaString::ComputeSizeUtf16(length);
|
|
|
|
auto string = vm->GetFactory()->AllocLineStringObject(size);
|
|
|
|
string->SetLength(length, compressed);
|
|
|
|
string->SetRawHashcode(0);
|
|
|
|
return string;
|
2021-09-04 08:06:49 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/* static */
|
2022-10-23 15:17:44 +00:00
|
|
|
inline EcmaString *EcmaString::CreateLineStringNoGC(const EcmaVM *vm, size_t length, bool compressed)
|
2021-09-04 08:06:49 +00:00
|
|
|
{
|
2022-10-23 15:17:44 +00:00
|
|
|
size_t size = compressed ? LineEcmaString::ComputeSizeUtf8(length) : LineEcmaString::ComputeSizeUtf16(length);
|
|
|
|
size = AlignUp(size, static_cast<size_t>(MemAlignment::MEM_ALIGN_OBJECT));
|
2024-03-04 12:53:06 +00:00
|
|
|
auto string = vm->GetFactory()->AllocLineStringObjectNoGC(size);
|
2021-09-04 08:06:49 +00:00
|
|
|
string->SetLength(length, compressed);
|
2022-01-14 13:50:26 +00:00
|
|
|
string->SetRawHashcode(0);
|
2022-05-31 08:29:55 +00:00
|
|
|
return string;
|
|
|
|
}
|
|
|
|
|
2022-10-23 15:17:44 +00:00
|
|
|
/* static */
|
|
|
|
inline EcmaString *EcmaString::CreateLineStringWithSpaceType(const EcmaVM *vm, size_t length, bool compressed,
|
|
|
|
MemSpaceType type)
|
|
|
|
{
|
2024-01-24 13:24:07 +00:00
|
|
|
ASSERT(IsSMemSpace(type));
|
2022-10-23 15:17:44 +00:00
|
|
|
size_t size = compressed ? LineEcmaString::ComputeSizeUtf8(length) : LineEcmaString::ComputeSizeUtf16(length);
|
|
|
|
EcmaString *string = nullptr;
|
|
|
|
switch (type) {
|
2024-01-24 13:24:07 +00:00
|
|
|
case MemSpaceType::SHARED_OLD_SPACE:
|
2022-10-23 15:17:44 +00:00
|
|
|
string = vm->GetFactory()->AllocOldSpaceLineStringObject(size);
|
|
|
|
break;
|
2024-01-24 13:24:07 +00:00
|
|
|
case MemSpaceType::SHARED_NON_MOVABLE:
|
2022-10-23 15:17:44 +00:00
|
|
|
string = vm->GetFactory()->AllocNonMovableLineStringObject(size);
|
|
|
|
break;
|
2024-03-25 06:52:04 +00:00
|
|
|
case MemSpaceType::SHARED_READ_ONLY_SPACE:
|
|
|
|
string = vm->GetFactory()->AllocReadOnlyLineStringObject(size);
|
|
|
|
break;
|
2022-10-23 15:17:44 +00:00
|
|
|
default:
|
2022-12-01 07:29:41 +00:00
|
|
|
LOG_ECMA(FATAL) << "this branch is unreachable";
|
2022-10-23 15:17:44 +00:00
|
|
|
UNREACHABLE();
|
|
|
|
}
|
|
|
|
string->SetLength(length, compressed);
|
|
|
|
string->SetRawHashcode(0);
|
|
|
|
return string;
|
|
|
|
}
|
|
|
|
|
2023-09-01 09:13:25 +00:00
|
|
|
// Allocates a sliced-string object in `type` with its raw hash code cleared and its parent set to
// Undefined (written with BarrierMode::SKIP_BARRIER). Length, start index and the real parent are
// not set here.
inline SlicedString *EcmaString::CreateSlicedString(const EcmaVM *vm, MemSpaceType type)
{
    auto sliced = SlicedString::Cast(vm->GetFactory()->AllocSlicedStringObject(type));
    sliced->SetRawHashcode(0);

    auto thread = vm->GetJSThread();
    sliced->SetParent(thread, JSTaggedValue::Undefined(), BarrierMode::SKIP_BARRIER);
    return sliced;
}
|
|
|
|
|
2023-05-08 09:07:03 +00:00
|
|
|
// Allocates a constant string in `type` that points at `utf8Data` instead of copying it
// (the pointer is stored via SetConstantData after a const_cast).
// `idOffset` is stored as the entity id and the relocated-data slot starts out as Undefined.
inline EcmaString *EcmaString::CreateConstantString(const EcmaVM *vm, const uint8_t *utf8Data,
                                                    size_t length, bool compressed, MemSpaceType type,
                                                    uint32_t idOffset)
{
    ASSERT(IsSMemSpace(type));
    auto constStr = ConstantString::Cast(vm->GetFactory()->AllocConstantStringObject(type));
    auto jsThread = vm->GetJSThread();

    constStr->SetLength(length, compressed);
    constStr->SetRawHashcode(0);
    constStr->SetConstantData(const_cast<uint8_t *>(utf8Data));
    // The string might be serialized, in which case the constant data is replaced by an index
    // into the panda file.
    constStr->SetEntityId(idOffset);
    constStr->SetRelocatedData(jsThread, JSTaggedValue::Undefined(), BarrierMode::SKIP_BARRIER);
    return constStr;
}
|
|
|
|
|
2022-10-23 15:17:44 +00:00
|
|
|
// Creates a tree (concatenation) string node whose children are `left` and `right`.
// `length` and `compressed` are stored as given; they are not recomputed from the children.
// ECMA_STRING_CHECK_LENGTH_AND_TRHOW runs first on `length` (presumably rejecting over-long strings -
// see the macro definition for the exact behaviour).
inline EcmaString *EcmaString::CreateTreeString(const EcmaVM *vm,
    const JSHandle<EcmaString> &left, const JSHandle<EcmaString> &right, uint32_t length, bool compressed)
{
    ECMA_STRING_CHECK_LENGTH_AND_TRHOW(vm, length);
    auto jsThread = vm->GetJSThread();
    auto tree = TreeEcmaString::Cast(vm->GetFactory()->AllocTreeStringObject());

    tree->SetLength(length, compressed);
    tree->SetRawHashcode(0);
    // The handles are dereferenced only after the node has been allocated.
    tree->SetFirst(jsThread, left.GetTaggedValue());
    tree->SetSecond(jsThread, right.GetTaggedValue());
    return tree;
}
|
|
|
|
|
2022-06-05 09:39:02 +00:00
|
|
|
/* static */
|
|
|
|
EcmaString *EcmaString::FastSubUtf8String(const EcmaVM *vm, const JSHandle<EcmaString> &src, uint32_t start,
|
2022-06-07 11:58:20 +00:00
|
|
|
uint32_t length)
|
2022-06-05 09:39:02 +00:00
|
|
|
{
|
2023-09-01 09:13:25 +00:00
|
|
|
JSHandle<EcmaString> string(vm->GetJSThread(), CreateLineString(vm, length, true));
|
2022-06-05 09:39:02 +00:00
|
|
|
// NOLINTNEXTLINE(cppcoreguidelines-pro-bounds-pointer-arithmetic)
|
2023-09-01 09:13:25 +00:00
|
|
|
FlatStringInfo srcFlat = FlattenAllString(vm, src);
|
2022-06-07 11:58:20 +00:00
|
|
|
Span<uint8_t> dst(string->GetDataUtf8Writable(), length);
|
2023-09-01 09:13:25 +00:00
|
|
|
Span<const uint8_t> source(srcFlat.GetDataUtf8() + start, length);
|
2022-10-23 15:17:44 +00:00
|
|
|
EcmaString::MemCopyChars(dst, length, source, length);
|
2022-06-05 09:39:02 +00:00
|
|
|
|
2023-09-01 09:13:25 +00:00
|
|
|
ASSERT_PRINT(CanBeCompressed(*string), "canBeCompresse does not match the real value!");
|
|
|
|
return *string;
|
2022-06-05 09:39:02 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/* static */
|
|
|
|
EcmaString *EcmaString::FastSubUtf16String(const EcmaVM *vm, const JSHandle<EcmaString> &src, uint32_t start,
|
2022-06-07 11:58:20 +00:00
|
|
|
uint32_t length)
|
2022-06-05 09:39:02 +00:00
|
|
|
{
|
2023-09-01 09:13:25 +00:00
|
|
|
FlatStringInfo srcFlat = FlattenAllString(vm, src);
|
|
|
|
bool canBeCompressed = CanBeCompressed(srcFlat.GetDataUtf16() + start, length);
|
|
|
|
JSHandle<EcmaString> string(vm->GetJSThread(), CreateLineString(vm, length, canBeCompressed));
|
|
|
|
// maybe happen GC,so get srcFlat again
|
|
|
|
srcFlat = FlattenAllString(vm, src);
|
2022-06-05 09:39:02 +00:00
|
|
|
if (canBeCompressed) {
|
|
|
|
// NOLINTNEXTLINE(cppcoreguidelines-pro-bounds-pointer-arithmetic)
|
2023-09-01 09:13:25 +00:00
|
|
|
CopyChars(string->GetDataUtf8Writable(), srcFlat.GetDataUtf16() + start, length);
|
2022-06-05 09:39:02 +00:00
|
|
|
} else {
|
2022-06-07 11:58:20 +00:00
|
|
|
uint32_t len = length * (sizeof(uint16_t) / sizeof(uint8_t));
|
2022-06-05 09:39:02 +00:00
|
|
|
// NOLINTNEXTLINE(cppcoreguidelines-pro-bounds-pointer-arithmetic)
|
2022-06-07 11:58:20 +00:00
|
|
|
Span<uint16_t> dst(string->GetDataUtf16Writable(), length);
|
2023-09-01 09:13:25 +00:00
|
|
|
Span<const uint16_t> source(srcFlat.GetDataUtf16() + start, length);
|
2022-10-23 15:17:44 +00:00
|
|
|
EcmaString::MemCopyChars(dst, len, source, len);
|
2022-06-05 09:39:02 +00:00
|
|
|
}
|
2023-09-01 09:13:25 +00:00
|
|
|
ASSERT_PRINT(canBeCompressed == CanBeCompressed(*string), "canBeCompresse does not match the real value!");
|
|
|
|
return *string;
|
2022-06-05 09:39:02 +00:00
|
|
|
}
|
2022-10-23 15:17:44 +00:00
|
|
|
|
|
|
|
inline uint16_t *EcmaString::GetData() const
|
|
|
|
{
|
|
|
|
ASSERT_PRINT(IsLineString(), "EcmaString: Read data from not LineString");
|
|
|
|
return LineEcmaString::Cast(this)->GetData();
|
|
|
|
}
|
|
|
|
|
|
|
|
inline const uint8_t *EcmaString::GetDataUtf8() const
|
|
|
|
{
|
|
|
|
ASSERT_PRINT(IsUtf8(), "EcmaString: Read data as utf8 for utf16 string");
|
2023-09-01 09:13:25 +00:00
|
|
|
if (IsLineString()) {
|
|
|
|
return reinterpret_cast<uint8_t *>(GetData());
|
2023-05-08 09:07:03 +00:00
|
|
|
}
|
2023-09-01 09:13:25 +00:00
|
|
|
return ConstantString::Cast(this)->GetConstantData();
|
2022-10-23 15:17:44 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
inline const uint16_t *EcmaString::GetDataUtf16() const
|
|
|
|
{
|
|
|
|
LOG_ECMA_IF(!IsUtf16(), FATAL) << "EcmaString: Read data as utf16 for utf8 string";
|
|
|
|
return GetData();
|
|
|
|
}
|
|
|
|
|
|
|
|
inline uint8_t *EcmaString::GetDataUtf8Writable()
|
|
|
|
{
|
|
|
|
ASSERT_PRINT(IsUtf8(), "EcmaString: Read data as utf8 for utf16 string");
|
2023-05-08 09:07:03 +00:00
|
|
|
if (IsConstantString()) {
|
|
|
|
return ConstantString::Cast(this)->GetConstantData();
|
|
|
|
}
|
2022-10-23 15:17:44 +00:00
|
|
|
return reinterpret_cast<uint8_t *>(GetData());
|
|
|
|
}
|
|
|
|
|
|
|
|
inline uint16_t *EcmaString::GetDataUtf16Writable()
|
|
|
|
{
|
|
|
|
LOG_ECMA_IF(!IsUtf16(), FATAL) << "EcmaString: Read data as utf16 for utf8 string";
|
|
|
|
return GetData();
|
|
|
|
}
|
|
|
|
|
2024-07-24 02:59:53 +00:00
|
|
|
inline size_t EcmaString::GetUtf8Length(bool modify, bool isGetBufferSize) const
|
2022-10-23 15:17:44 +00:00
|
|
|
{
|
|
|
|
if (!IsUtf16()) {
|
|
|
|
return GetLength() + 1; // add place for zero in the end
|
|
|
|
}
|
2023-09-01 09:13:25 +00:00
|
|
|
CVector<uint16_t> tmpBuf;
|
|
|
|
const uint16_t *data = GetUtf16DataFlat(this, tmpBuf);
|
2024-07-24 02:59:53 +00:00
|
|
|
return base::utf_helper::Utf16ToUtf8Size(data, GetLength(), modify, isGetBufferSize);
|
2022-10-23 15:17:44 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
template<bool verify>
|
|
|
|
inline uint16_t EcmaString::At(int32_t index) const
|
|
|
|
{
|
|
|
|
int32_t length = static_cast<int32_t>(GetLength());
|
2024-06-09 12:22:15 +00:00
|
|
|
if constexpr (verify) {
|
2022-10-23 15:17:44 +00:00
|
|
|
if ((index < 0) || (index >= length)) {
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
}
|
2023-09-01 09:13:25 +00:00
|
|
|
switch (GetStringType()) {
|
|
|
|
case JSType::LINE_STRING:
|
|
|
|
return LineEcmaString::Cast(this)->Get<verify>(index);
|
|
|
|
case JSType::CONSTANT_STRING:
|
|
|
|
return ConstantString::Cast(this)->Get<verify>(index);
|
|
|
|
case JSType::SLICED_STRING:
|
|
|
|
return SlicedString::Cast(this)->Get<verify>(index);
|
|
|
|
case JSType::TREE_STRING:
|
|
|
|
return TreeEcmaString::Cast(this)->Get<verify>(index);
|
|
|
|
default:
|
|
|
|
LOG_ECMA(FATAL) << "this branch is unreachable";
|
|
|
|
UNREACHABLE();
|
2022-10-23 15:17:44 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-11-01 09:43:38 +00:00
|
|
|
// Returns a non-owning view over the 8-bit data of this string, GetLength() bytes long.
// Only meaningful for compressed strings (asserted in debug builds); nothing is copied.
inline Span<const uint8_t> EcmaString::FastToUtf8Span() const
{
    uint32_t byteCount = GetLength();
    ASSERT(IsUtf8());
    const uint8_t *bytes = GetDataUtf8();
    return Span<const uint8_t>(bytes, byteCount);
}
|
|
|
|
|
2022-10-23 15:17:44 +00:00
|
|
|
inline void EcmaString::WriteData(uint32_t index, uint16_t src)
|
|
|
|
{
|
|
|
|
ASSERT(index < GetLength());
|
|
|
|
ASSERT(IsLineString());
|
|
|
|
LineEcmaString::Cast(this)->Set(index, src);
|
|
|
|
}
|
|
|
|
|
|
|
|
inline bool EcmaString::IsFlat() const
|
|
|
|
{
|
|
|
|
if (!JSTaggedValue(this).IsTreeString()) {
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return TreeEcmaString::Cast(this)->IsFlat();
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename Char>
|
|
|
|
void EcmaString::WriteToFlat(EcmaString *src, Char *buf, uint32_t maxLength)
|
|
|
|
{
|
|
|
|
DISALLOW_GARBAGE_COLLECTION;
|
|
|
|
uint32_t length = src->GetLength();
|
|
|
|
if (length == 0) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
while (true) {
|
|
|
|
ASSERT(length <= maxLength && length > 0);
|
|
|
|
ASSERT(length <= src->GetLength());
|
|
|
|
switch (src->GetStringType()) {
|
|
|
|
case JSType::LINE_STRING: {
|
|
|
|
if (src->IsUtf8()) {
|
|
|
|
CopyChars(buf, src->GetDataUtf8(), length);
|
|
|
|
} else {
|
|
|
|
CopyChars(buf, src->GetDataUtf16(), length);
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
}
|
2023-05-08 09:07:03 +00:00
|
|
|
case JSType::CONSTANT_STRING: {
|
|
|
|
ASSERT(src->IsUtf8());
|
|
|
|
CopyChars(buf, src->GetDataUtf8(), length);
|
|
|
|
return;
|
|
|
|
}
|
2022-10-23 15:17:44 +00:00
|
|
|
case JSType::TREE_STRING: {
|
|
|
|
TreeEcmaString *treeSrc = TreeEcmaString::Cast(src);
|
|
|
|
EcmaString *first = EcmaString::Cast(treeSrc->GetFirst());
|
|
|
|
EcmaString *second = EcmaString::Cast(treeSrc->GetSecond());
|
|
|
|
uint32_t firstLength = first->GetLength();
|
|
|
|
uint32_t secondLength = second->GetLength();
|
|
|
|
if (secondLength >= firstLength) {
|
|
|
|
// second string is longer. So recurse over first.
|
|
|
|
WriteToFlat(first, buf, maxLength);
|
|
|
|
if (first == second) {
|
|
|
|
CopyChars(buf + firstLength, buf, firstLength);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
buf += firstLength;
|
|
|
|
maxLength -= firstLength;
|
|
|
|
src = second;
|
|
|
|
length -= firstLength;
|
|
|
|
} else {
|
|
|
|
// first string is longer. So recurse over second.
|
|
|
|
if (secondLength > 0) {
|
|
|
|
if (secondLength == 1) {
|
|
|
|
buf[firstLength] = static_cast<Char>(second->At<false>(0));
|
2023-05-08 09:07:03 +00:00
|
|
|
} else if ((second->IsLineOrConstantString()) && second->IsUtf8()) {
|
2022-10-23 15:17:44 +00:00
|
|
|
CopyChars(buf + firstLength, second->GetDataUtf8(), secondLength);
|
|
|
|
} else {
|
|
|
|
WriteToFlat(second, buf + firstLength, maxLength - firstLength);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
maxLength = firstLength;
|
|
|
|
src = first;
|
|
|
|
length -= secondLength;
|
|
|
|
}
|
|
|
|
continue;
|
|
|
|
}
|
2023-09-01 09:13:25 +00:00
|
|
|
case JSType::SLICED_STRING: {
|
|
|
|
EcmaString *parent = EcmaString::Cast(SlicedString::Cast(src)->GetParent());
|
|
|
|
if (src->IsUtf8()) {
|
|
|
|
CopyChars(buf, parent->GetDataUtf8() + SlicedString::Cast(src)->GetStartIndex(), length);
|
|
|
|
} else {
|
|
|
|
CopyChars(buf, parent->GetDataUtf16() + SlicedString::Cast(src)->GetStartIndex(), length);
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
}
|
2022-10-23 15:17:44 +00:00
|
|
|
default:
|
2022-12-01 07:29:41 +00:00
|
|
|
LOG_ECMA(FATAL) << "this branch is unreachable";
|
2022-10-23 15:17:44 +00:00
|
|
|
UNREACHABLE();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-04-15 01:48:19 +00:00
|
|
|
template <typename Char>
|
|
|
|
void EcmaString::WriteToFlatWithPos(EcmaString *src, Char *buf, uint32_t length, uint32_t pos)
|
|
|
|
{
|
|
|
|
DISALLOW_GARBAGE_COLLECTION;
|
|
|
|
[[ maybe_unused ]] uint32_t maxLength = src->GetLength();
|
|
|
|
if (length == 0) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
while (true) {
|
|
|
|
ASSERT(length + pos <= maxLength && length > 0);
|
|
|
|
ASSERT(length <= src->GetLength());
|
|
|
|
ASSERT(pos >= 0);
|
|
|
|
switch (src->GetStringType()) {
|
|
|
|
case JSType::LINE_STRING: {
|
|
|
|
if (src->IsUtf8()) {
|
|
|
|
CopyChars(buf, src->GetDataUtf8() + pos, length);
|
|
|
|
} else {
|
|
|
|
CopyChars(buf, src->GetDataUtf16() + pos, length);
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
case JSType::CONSTANT_STRING: {
|
|
|
|
ASSERT(src->IsUtf8());
|
|
|
|
CopyChars(buf, src->GetDataUtf8() + pos, length);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
case JSType::TREE_STRING: {
|
|
|
|
TreeEcmaString *treeSrc = TreeEcmaString::Cast(src);
|
|
|
|
EcmaString *first = EcmaString::Cast(treeSrc->GetFirst());
|
|
|
|
ASSERT(first->IsLineString());
|
|
|
|
src = first;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
case JSType::SLICED_STRING: {
|
|
|
|
EcmaString *parent = EcmaString::Cast(SlicedString::Cast(src)->GetParent());
|
|
|
|
if (src->IsUtf8()) {
|
|
|
|
CopyChars(buf, parent->GetDataUtf8() + SlicedString::Cast(src)->GetStartIndex() + pos, length);
|
|
|
|
} else {
|
|
|
|
CopyChars(buf, parent->GetDataUtf16() + SlicedString::Cast(src)->GetStartIndex() + pos, length);
|
|
|
|
}
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
LOG_ECMA(FATAL) << "this branch is unreachable";
|
|
|
|
UNREACHABLE();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-09-01 09:13:25 +00:00
|
|
|
inline const uint8_t *FlatStringInfo::GetDataUtf8() const
|
|
|
|
{
|
|
|
|
return string_->GetDataUtf8() + startIndex_;
|
|
|
|
}
|
|
|
|
|
|
|
|
inline const uint16_t *FlatStringInfo::GetDataUtf16() const
|
|
|
|
{
|
|
|
|
return string_->GetDataUtf16() + startIndex_;
|
|
|
|
}
|
|
|
|
|
|
|
|
inline uint8_t *FlatStringInfo::GetDataUtf8Writable() const
|
|
|
|
{
|
|
|
|
return string_->GetDataUtf8Writable() + startIndex_;
|
|
|
|
}
|
|
|
|
|
2024-04-15 01:48:19 +00:00
|
|
|
inline uint16_t *FlatStringInfo::GetDataUtf16Writable() const
|
|
|
|
{
|
|
|
|
return string_->GetDataUtf16Writable() + startIndex_;
|
|
|
|
}
|
|
|
|
|
2022-10-23 15:17:44 +00:00
|
|
|
inline const uint8_t *EcmaStringAccessor::GetDataUtf8()
|
|
|
|
{
|
|
|
|
return string_->GetDataUtf8();
|
|
|
|
}
|
|
|
|
|
|
|
|
inline const uint16_t *EcmaStringAccessor::GetDataUtf16()
|
|
|
|
{
|
|
|
|
return string_->GetDataUtf16();
|
|
|
|
}
|
|
|
|
|
2024-07-24 02:59:53 +00:00
|
|
|
inline size_t EcmaStringAccessor::GetUtf8Length(bool isGetBufferSize) const
|
2022-10-23 15:17:44 +00:00
|
|
|
{
|
2024-07-24 02:59:53 +00:00
|
|
|
return string_->GetUtf8Length(true, isGetBufferSize);
|
2022-10-23 15:17:44 +00:00
|
|
|
}
|
|
|
|
|
2022-12-26 10:40:19 +00:00
|
|
|
inline void EcmaStringAccessor::ReadData(EcmaString *dst, EcmaString *src,
|
2022-10-23 15:17:44 +00:00
|
|
|
uint32_t start, uint32_t destSize, uint32_t length)
|
|
|
|
{
|
|
|
|
dst->WriteData(src, start, destSize, length);
|
|
|
|
}
|
2023-11-01 09:43:38 +00:00
|
|
|
|
|
|
|
// Forwards to EcmaString::FastToUtf8Span() on the wrapped string.
inline Span<const uint8_t> EcmaStringAccessor::FastToUtf8Span()
{
    Span<const uint8_t> view = string_->FastToUtf8Span();
    return view;
}
|
2022-06-05 09:39:02 +00:00
|
|
|
} // namespace panda::ecmascript
|
2021-09-04 08:06:49 +00:00
|
|
|
#endif
|