1 /**
2 * Copyright (c) 2023-2024 Huawei Device Co., Ltd.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
#include <type_traits>

#include "operands.h"
#include "codegen.h"
#include "compiler/optimizer/ir/analysis.h"
#include "runtime/include/coretypes/string.h"
#include "runtime/include/coretypes/array.h"
20
21 namespace ark::compiler {
22
23 class SbAppendArgs {
24 private:
25 Reg dst_;
26 Reg builder_;
27 Reg value_;
28
29 public:
30 SbAppendArgs() = delete;
SbAppendArgs(Reg dst,Reg builder,Reg value)31 SbAppendArgs(Reg dst, Reg builder, Reg value) : dst_(dst), builder_(builder), value_(value)
32 {
33 ASSERT(dst_ != INVALID_REGISTER);
34 ASSERT(builder_ != INVALID_REGISTER);
35 ASSERT(value_ != INVALID_REGISTER);
36 }
Dst() const37 Reg Dst() const
38 {
39 return dst_;
40 }
Builder() const41 Reg Builder() const
42 {
43 return builder_;
44 }
Value() const45 Reg Value() const
46 {
47 return value_;
48 }
DstCanBeUsedAsTemp() const49 bool DstCanBeUsedAsTemp() const
50 {
51 return (dst_.GetId() != builder_.GetId() && dst_.GetId() != value_.GetId());
52 }
SbBufferAddr() const53 MemRef SbBufferAddr() const
54 {
55 return MemRef(builder_, RuntimeInterface::GetSbBufferOffset());
56 }
SbIndexAddr() const57 MemRef SbIndexAddr() const
58 {
59 return MemRef(builder_, RuntimeInterface::GetSbIndexOffset());
60 }
SbCompressAddr() const61 MemRef SbCompressAddr() const
62 {
63 return MemRef(builder_, RuntimeInterface::GetSbCompressOffset());
64 }
SbLengthAddr() const65 MemRef SbLengthAddr() const
66 {
67 return MemRef(builder_, RuntimeInterface::GetSbLengthOffset());
68 }
69 };
70
CreateMathTrunc(IntrinsicInst * inst,Reg dst,SRCREGS src)71 void Codegen::CreateMathTrunc([[maybe_unused]] IntrinsicInst *inst, Reg dst, SRCREGS src)
72 {
73 GetEncoder()->EncodeTrunc(dst, src[0]);
74 }
75
CreateMathRoundAway(IntrinsicInst * inst,Reg dst,SRCREGS src)76 void Codegen::CreateMathRoundAway([[maybe_unused]] IntrinsicInst *inst, Reg dst, SRCREGS src)
77 {
78 GetEncoder()->EncodeRoundAway(dst, src[0]);
79 }
80
CreateArrayCopyTo(IntrinsicInst * inst,Reg dst,SRCREGS src)81 void Codegen::CreateArrayCopyTo(IntrinsicInst *inst, [[maybe_unused]] Reg dst, SRCREGS src)
82 {
83 auto entrypointId = EntrypointId::INVALID;
84
85 switch (inst->GetIntrinsicId()) {
86 case RuntimeInterface::IntrinsicId::INTRINSIC_STD_CORE_BOOL_COPY_TO:
87 case RuntimeInterface::IntrinsicId::INTRINSIC_STD_CORE_BYTE_COPY_TO:
88 entrypointId = EntrypointId::ARRAY_COPY_TO_1B;
89 break;
90
91 case RuntimeInterface::IntrinsicId::INTRINSIC_STD_CORE_CHAR_COPY_TO:
92 case RuntimeInterface::IntrinsicId::INTRINSIC_STD_CORE_SHORT_COPY_TO:
93 entrypointId = EntrypointId::ARRAY_COPY_TO_2B;
94 break;
95
96 case RuntimeInterface::IntrinsicId::INTRINSIC_STD_CORE_INT_COPY_TO:
97 case RuntimeInterface::IntrinsicId::INTRINSIC_STD_CORE_FLOAT_COPY_TO:
98 entrypointId = EntrypointId::ARRAY_COPY_TO_4B;
99 break;
100
101 case RuntimeInterface::IntrinsicId::INTRINSIC_STD_CORE_LONG_COPY_TO:
102 case RuntimeInterface::IntrinsicId::INTRINSIC_STD_CORE_DOUBLE_COPY_TO:
103 entrypointId = EntrypointId::ARRAY_COPY_TO_8B;
104 break;
105
106 default:
107 UNREACHABLE();
108 break;
109 }
110
111 ASSERT(entrypointId != EntrypointId::COUNT);
112
113 auto srcObj = src[FIRST_OPERAND];
114 auto dstObj = src[SECOND_OPERAND];
115 auto dstStart = src[THIRD_OPERAND];
116 auto srcStart = src[FOURTH_OPERAND];
117 auto srcEnd = src[FIFTH_OPERAND];
118 CallFastPath(inst, entrypointId, INVALID_REGISTER, RegMask::GetZeroMask(), srcObj, dstObj, dstStart, srcStart,
119 srcEnd);
120 }
121
122 // Generates a call to StringBuilder.append() for values (EtsBool/Char/Bool/Short/Int/Long),
123 // which are translated to array of utf16 chars.
GenerateSbAppendCall(Codegen * cg,IntrinsicInst * inst,SbAppendArgs args,RuntimeInterface::EntrypointId entrypoint)124 static inline void GenerateSbAppendCall(Codegen *cg, IntrinsicInst *inst, SbAppendArgs args,
125 RuntimeInterface::EntrypointId entrypoint)
126 {
127 auto *runtime = cg->GetGraph()->GetRuntime();
128 if (cg->GetGraph()->IsAotMode()) {
129 auto *enc = cg->GetEncoder();
130 ScopedTmpReg klass(enc);
131 enc->EncodeLdr(klass, false, MemRef(cg->ThreadReg(), runtime->GetArrayU16ClassPointerTlsOffset(cg->GetArch())));
132 cg->CallFastPath(inst, entrypoint, args.Dst(), {}, args.Builder(), args.Value(), klass);
133 } else {
134 auto klass = TypedImm(reinterpret_cast<uintptr_t>(runtime->GetArrayU16Class(cg->GetGraph()->GetMethod())));
135 cg->CallFastPath(inst, entrypoint, args.Dst(), {}, args.Builder(), args.Value(), klass);
136 }
137 }
138
CreateStringBuilderAppendNumber(IntrinsicInst * inst,Reg dst,SRCREGS src)139 void Codegen::CreateStringBuilderAppendNumber(IntrinsicInst *inst, Reg dst, SRCREGS src)
140 {
141 auto sb = src[FIRST_OPERAND];
142 auto num = src[SECOND_OPERAND];
143 auto type = ConvertDataType(DataType::INT64, GetArch());
144 ScopedTmpReg tmp(GetEncoder(), type);
145
146 if (num.GetType() != INT64_TYPE) {
147 ASSERT(num.GetType() == INT32_TYPE || num.GetType() == INT16_TYPE || num.GetType() == INT8_TYPE);
148 if (dst.GetId() != sb.GetId() && dst.GetId() != num.GetId()) {
149 GetEncoder()->EncodeCast(dst.As(type), true, num, true);
150 num = dst.As(type);
151 } else {
152 GetEncoder()->EncodeCast(tmp, true, num, true);
153 num = tmp.GetReg();
154 }
155 }
156 GenerateSbAppendCall(this, inst, SbAppendArgs(dst, sb, num), EntrypointId::STRING_BUILDER_APPEND_LONG);
157 }
158
CreateStringBuilderAppendChar(IntrinsicInst * inst,Reg dst,SRCREGS src)159 void Codegen::CreateStringBuilderAppendChar(IntrinsicInst *inst, Reg dst, SRCREGS src)
160 {
161 ASSERT(IsCompressedStringsEnabled());
162 auto entrypoint = EntrypointId::STRING_BUILDER_APPEND_CHAR_COMPRESSED;
163 SbAppendArgs args(dst, src[FIRST_OPERAND], src[SECOND_OPERAND]);
164 GenerateSbAppendCall(this, inst, args, entrypoint);
165 }
166
CreateStringBuilderAppendBool(IntrinsicInst * inst,Reg dst,SRCREGS src)167 void Codegen::CreateStringBuilderAppendBool(IntrinsicInst *inst, Reg dst, SRCREGS src)
168 {
169 SbAppendArgs args(dst, src[FIRST_OPERAND], src[SECOND_OPERAND]);
170 GenerateSbAppendCall(this, inst, args, EntrypointId::STRING_BUILDER_APPEND_BOOL);
171 }
172
EncodeSbAppendNullString(Codegen * cg,IntrinsicInst * inst,Reg dst,Reg builder)173 static inline void EncodeSbAppendNullString(Codegen *cg, IntrinsicInst *inst, Reg dst, Reg builder)
174 {
175 auto entrypoint = RuntimeInterface::EntrypointId::STRING_BUILDER_APPEND_NULL_STRING;
176 cg->CallRuntime(inst, entrypoint, dst, {}, builder);
177 }
178
EncodeSbInsertStringIntoSlot(Codegen * cg,IntrinsicInst * inst,Reg slot,SbAppendArgs args)179 static inline void EncodeSbInsertStringIntoSlot(Codegen *cg, IntrinsicInst *inst, Reg slot, SbAppendArgs args)
180 {
181 ASSERT(slot.IsValid());
182 auto slotMemRef = MemRef(slot.As(Codegen::ConvertDataType(DataType::REFERENCE, cg->GetArch())));
183 RegMask preserved(MakeMask(args.Builder().GetId(), args.Value().GetId(), slot.GetId()));
184 cg->CreatePreWRB(inst, slotMemRef, preserved);
185 cg->GetEncoder()->EncodeStr(args.Value(), slotMemRef);
186 preserved.Reset(slot.GetId());
187 cg->CreatePostWRB(inst, slotMemRef, args.Value(), INVALID_REGISTER, preserved);
188 }
189
EncodeSbAppendString(Codegen * cg,IntrinsicInst * inst,const SbAppendArgs & args,LabelHolder::LabelId labelReturn,LabelHolder::LabelId labelSlowPath)190 static void EncodeSbAppendString(Codegen *cg, IntrinsicInst *inst, const SbAppendArgs &args,
191 LabelHolder::LabelId labelReturn, LabelHolder::LabelId labelSlowPath)
192 {
193 auto *enc = cg->GetEncoder();
194 ScopedTmpReg tmp1(enc);
195 ScopedTmpRegLazy tmp2(enc, false);
196 auto reg0 = cg->ConvertInstTmpReg(inst, DataType::REFERENCE);
197 auto reg1 = tmp1.GetReg().As(INT32_TYPE);
198 auto reg2 = INVALID_REGISTER;
199 if (args.DstCanBeUsedAsTemp() && args.Dst().GetId() != reg0.GetId()) {
200 reg2 = args.Dst().As(INT32_TYPE);
201 } else {
202 tmp2.Acquire();
203 reg2 = tmp2.GetReg().As(INT32_TYPE);
204 }
205 auto labelInsertStringIntoSlot = enc->CreateLabel();
206 auto labelFastPathDone = enc->CreateLabel();
207 auto labelIncIndex = enc->CreateLabel();
208 // Jump to slowPath if buffer is full and needs to be reallocated
209 enc->EncodeLdr(reg0, false, args.SbBufferAddr());
210 enc->EncodeLdr(reg1, false, MemRef(reg0, coretypes::Array::GetLengthOffset()));
211 enc->EncodeLdr(reg2, false, args.SbIndexAddr());
212 enc->EncodeJump(labelSlowPath, reg2, reg1, Condition::HS);
213 // Compute an address of a free slot so as not to reload SbIndex again
214 enc->EncodeShl(reg1, reg2, Imm(compiler::DataType::ShiftByType(compiler::DataType::REFERENCE, cg->GetArch())));
215 enc->EncodeAdd(reg0, reg0, Imm(coretypes::Array::GetDataOffset()));
216 enc->EncodeAdd(reg0, reg0, reg1);
217 // Process string length and compression
218 enc->EncodeLdr(reg1, false, MemRef(args.Value(), ark::coretypes::STRING_LENGTH_OFFSET));
219 // Do nothing if length of string is equal to 0.
220 // The least significant bit indicates COMPRESSED/UNCOMPRESSED,
221 // thus if (packed length <= 1) then the actual length is equal to 0.
222 enc->EncodeJump(labelFastPathDone, reg1, Imm(1), Condition::LS);
223 // Skip setting 'compress' to false if the string is compressed.
224 enc->EncodeJumpTest(labelIncIndex, reg1, Imm(1), Condition::TST_EQ);
225 // Otherwise set 'compress' to false
226 enc->EncodeSti(0, 1, args.SbCompressAddr());
227 // Increment 'index' field
228 enc->BindLabel(labelIncIndex);
229 enc->EncodeAdd(reg2, reg2, Imm(1));
230 enc->EncodeStr(reg2, args.SbIndexAddr());
231 // Unpack length of string
232 enc->EncodeShr(reg1, reg1, Imm(1));
233 // Add length of string to the current length of StringBuilder
234 enc->EncodeLdr(reg2, false, args.SbLengthAddr());
235 enc->EncodeAdd(reg2, reg2, reg1);
236 enc->EncodeStr(reg2, args.SbLengthAddr());
237 // Insert the string into the slot:
238 // - reg0 contains an address of the slot
239 // - release temps for barriers
240 enc->BindLabel(labelInsertStringIntoSlot);
241 tmp1.Release();
242 tmp2.Release();
243 EncodeSbInsertStringIntoSlot(cg, inst, reg0, args);
244 // Return the reference to StringBuilder
245 enc->BindLabel(labelFastPathDone);
246 enc->EncodeMov(args.Dst(), args.Builder());
247 enc->EncodeJump(labelReturn);
248 }
249
CreateStringBuilderAppendString(IntrinsicInst * inst,Reg dst,SRCREGS src)250 void Codegen::CreateStringBuilderAppendString(IntrinsicInst *inst, Reg dst, SRCREGS src)
251 {
252 using StringLengthType = std::result_of<decltype (&coretypes::String::GetLength)(coretypes::String)>::type;
253 static_assert(TypeInfo::GetScalarTypeBySize(sizeof(ark::ArraySizeT) * CHAR_BIT) == INT32_TYPE);
254 static_assert(TypeInfo::GetScalarTypeBySize(sizeof(StringLengthType) * CHAR_BIT) == INT32_TYPE);
255 ASSERT(GetArch() != Arch::AARCH32);
256 ASSERT(IsCompressedStringsEnabled());
257
258 auto *enc = GetEncoder();
259 auto builder = src[FIRST_OPERAND];
260 auto *strInst = inst->GetInput(1).GetInst();
261 if (strInst->IsNullPtr()) {
262 EncodeSbAppendNullString(this, inst, dst, builder);
263 return;
264 }
265 auto labelReturn = enc->CreateLabel();
266 auto labelSlowPath = enc->CreateLabel();
267 auto str = src[SECOND_OPERAND];
268 if (IsInstNotNull(strInst)) {
269 EncodeSbAppendString(this, inst, SbAppendArgs(dst, builder, str), labelReturn, labelSlowPath);
270 } else {
271 auto labelStrNotNull = enc->CreateLabel();
272 enc->EncodeJump(labelStrNotNull, str, Condition::NE);
273 EncodeSbAppendNullString(this, inst, dst, builder);
274 enc->EncodeJump(labelReturn);
275 enc->BindLabel(labelStrNotNull);
276 EncodeSbAppendString(this, inst, SbAppendArgs(dst, builder, str), labelReturn, labelSlowPath);
277 }
278 // Slow path
279 static constexpr auto ENTRYPOINT_ID = RuntimeInterface::EntrypointId::STRING_BUILDER_APPEND_STRING;
280 enc->BindLabel(labelSlowPath);
281 CallRuntime(inst, ENTRYPOINT_ID, dst, {}, builder, str);
282 // Return
283 enc->BindLabel(labelReturn);
284 }
285
CreateStringConcat(IntrinsicInst * inst,Reg dst,SRCREGS src)286 void Codegen::CreateStringConcat([[maybe_unused]] IntrinsicInst *inst, Reg dst, SRCREGS src)
287 {
288 ASSERT(IsCompressedStringsEnabled());
289 switch (inst->GetIntrinsicId()) {
290 case RuntimeInterface::IntrinsicId::INTRINSIC_STD_CORE_STRING_CONCAT2: {
291 auto str1 = src[FIRST_OPERAND];
292 auto str2 = src[SECOND_OPERAND];
293 CallFastPath(inst, EntrypointId::STRING_CONCAT2_TLAB, dst, {}, str1, str2);
294 break;
295 }
296
297 case RuntimeInterface::IntrinsicId::INTRINSIC_STD_CORE_STRING_CONCAT3: {
298 auto str1 = src[FIRST_OPERAND];
299 auto str2 = src[SECOND_OPERAND];
300 auto str3 = src[THIRD_OPERAND];
301 CallFastPath(inst, EntrypointId::STRING_CONCAT3_TLAB, dst, {}, str1, str2, str3);
302 break;
303 }
304
305 case RuntimeInterface::IntrinsicId::INTRINSIC_STD_CORE_STRING_CONCAT4: {
306 auto str1 = src[FIRST_OPERAND];
307 auto str2 = src[SECOND_OPERAND];
308 auto str3 = src[THIRD_OPERAND];
309 auto str4 = src[FOURTH_OPERAND];
310 CallFastPath(inst, EntrypointId::STRING_CONCAT4_TLAB, dst, {}, str1, str2, str3, str4);
311 break;
312 }
313
314 default:
315 UNREACHABLE();
316 break;
317 }
318 }
319
CreateStringBuilderToString(IntrinsicInst * inst,Reg dst,SRCREGS src)320 void Codegen::CreateStringBuilderToString(IntrinsicInst *inst, Reg dst, SRCREGS src)
321 {
322 ASSERT(GetArch() != Arch::AARCH32);
323 ASSERT(IsCompressedStringsEnabled());
324
325 auto *enc = GetEncoder();
326 auto entrypoint = EntrypointId::STRING_BUILDER_TO_STRING;
327 auto sb = src[FIRST_OPERAND];
328 if (GetGraph()->IsAotMode()) {
329 ScopedTmpReg klass(enc);
330 enc->EncodeLdr(klass, false, MemRef(ThreadReg(), GetRuntime()->GetStringClassPointerTlsOffset(GetArch())));
331 CallFastPath(inst, entrypoint, dst, {}, sb, klass);
332 } else {
333 auto klass = TypedImm(reinterpret_cast<uintptr_t>(GetRuntime()->GetStringClass(GetGraph()->GetMethod())));
334 CallFastPath(inst, entrypoint, dst, {}, sb, klass);
335 }
336 }
337
CreateDoubleToStringDecimal(IntrinsicInst * inst,Reg dst,SRCREGS src)338 void Codegen::CreateDoubleToStringDecimal(IntrinsicInst *inst, Reg dst, SRCREGS src)
339 {
340 ASSERT(GetArch() != Arch::AARCH32);
341 ASSERT(inst->GetInputsCount() == 4U && inst->RequireState());
342 auto cache = src[FIRST_OPERAND];
343 auto numAsInt = src[SECOND_OPERAND];
344 auto unused = src[THIRD_OPERAND];
345 auto entrypoint = EntrypointId::DOUBLE_TO_STRING_DECIMAL;
346 CallFastPath(inst, entrypoint, dst, {}, cache, numAsInt, unused);
347 }
348
349 /* See utf::IsWhiteSpaceChar() for the details */
CreateCharIsWhiteSpace(IntrinsicInst * inst,Reg dst,SRCREGS src)350 void Codegen::CreateCharIsWhiteSpace([[maybe_unused]] IntrinsicInst *inst, Reg dst, SRCREGS src)
351 {
352 ASSERT(GetArch() != Arch::AARCH32);
353 auto entrypoint = RuntimeInterface::EntrypointId::CHAR_IS_WHITE_SPACE;
354 auto ch = src[FIRST_OPERAND];
355 CallFastPath(inst, entrypoint, dst, {}, ch.As(INT16_TYPE));
356 }
357
CreateStringTrimLeft(IntrinsicInst * inst,Reg dst,SRCREGS src)358 void Codegen::CreateStringTrimLeft(IntrinsicInst *inst, Reg dst, SRCREGS src)
359 {
360 ASSERT(IsCompressedStringsEnabled());
361 auto str = src[FIRST_OPERAND];
362 auto unused = TypedImm(0);
363 // llvm backend needs unused args to call 3-args slow_path from 1-arg fast_path.
364 CallFastPath(inst, RuntimeInterface::EntrypointId::STRING_TRIM_LEFT, dst, {}, str, unused, unused);
365 }
366
CreateStringTrimRight(IntrinsicInst * inst,Reg dst,SRCREGS src)367 void Codegen::CreateStringTrimRight(IntrinsicInst *inst, Reg dst, SRCREGS src)
368 {
369 ASSERT(IsCompressedStringsEnabled());
370 auto str = src[FIRST_OPERAND];
371 auto unused = TypedImm(0);
372 // llvm backend needs unused args to call 3-args slow_path from 1-arg fast_path.
373 CallFastPath(inst, RuntimeInterface::EntrypointId::STRING_TRIM_RIGHT, dst, {}, str, unused, unused);
374 }
375
CreateStringTrim(IntrinsicInst * inst,Reg dst,SRCREGS src)376 void Codegen::CreateStringTrim(IntrinsicInst *inst, Reg dst, SRCREGS src)
377 {
378 ASSERT(IsCompressedStringsEnabled());
379 auto str = src[FIRST_OPERAND];
380 auto unused = TypedImm(0);
381 // llvm backend needs unused args to call 3-args slow_path from 1-arg fast_path.
382 CallFastPath(inst, RuntimeInterface::EntrypointId::STRING_TRIM, dst, {}, str, unused, unused);
383 }
384
385 } // namespace ark::compiler
386