dart-lang
diff --git a/‎runtime/tests/vm/dart/string_equals_test.dart
Lines changed: 44 additions & 0 deletions b/‎runtime/tests/vm/dart/string_equals_test.dart
Lines changed: 44 additions & 0 deletions
diff --git a/‎runtime/tests/vm/dart_2/string_equals_test.dart
Lines changed: 46 additions & 0 deletions b/‎runtime/tests/vm/dart_2/string_equals_test.dart
Lines changed: 46 additions & 0 deletions
diff --git a/‎runtime/vm/app_snapshot.cc
Lines changed: 26 additions & 1 deletion b/‎runtime/vm/app_snapshot.cc
Lines changed: 26 additions & 1 deletion
diff --git a/‎runtime/vm/compiler/asm_intrinsifier_arm.cc
Lines changed: 27 additions & 20 deletions b/‎runtime/vm/compiler/asm_intrinsifier_arm.cc
Lines changed: 27 additions & 20 deletions
diff --git a/‎runtime/vm/compiler/asm_intrinsifier_arm64.cc
Lines changed: 32 additions & 25 deletions b/‎runtime/vm/compiler/asm_intrinsifier_arm64.cc
Lines changed: 32 additions & 25 deletions
diff --git a/‎runtime/vm/compiler/asm_intrinsifier_ia32.cc
Lines changed: 26 additions & 20 deletions b/‎runtime/vm/compiler/asm_intrinsifier_ia32.cc
Lines changed: 26 additions & 20 deletions
@@ -0,0 +1,44 @@
+// Copyright (c) 2022, the Dart project authors.  Please see the AUTHORS file
+// for details. All rights reserved. Use of this source code is governed by a
+// BSD-style license that can be found in the LICENSE file.
+//
+// Verifies that the string equality implementation correctly handles strings
+// of various lengths.
+
+import 'dart:math';
+
+import "package:expect/expect.dart";
+
+/// Checks that `==` on strings built around [s_piece] and [t_piece] yields
+/// [expectedEquality].
+///
+/// [ints] is converted to a string `s` that serves as shared padding. The
+/// pieces are compared in the middle (`s + piece + s`), at the tail
+/// (`s + piece`) and at the head (`piece + s`) of otherwise equal strings.
+/// Every pair is also expected to be two distinct objects, so the comparison
+/// cannot be satisfied by an identity check alone.
+compare(List<int> ints, String s_piece, String t_piece, bool expectedEquality) {
+  final s = String.fromCharCodes(ints);
+  // Note: Expect.equals takes the expected value first, then the actual one.
+  String s_mid = s + s_piece + s;
+  String t_mid = s + t_piece + s;
+  Expect.isFalse(identical(s_mid, t_mid));
+  Expect.equals(expectedEquality, s_mid == t_mid);
+  String s_tail = s + s_piece;
+  String t_tail = s + t_piece;
+  Expect.isFalse(identical(s_tail, t_tail));
+  Expect.equals(expectedEquality, s_tail == t_tail);
+  String s_head = s_piece + s;
+  String t_head = t_piece + s;
+  Expect.isFalse(identical(s_head, t_head));
+  Expect.equals(expectedEquality, s_head == t_head);
+}
+
+/// Runs [compare] with padding of every length below 128, first using code
+/// units from 40 to 69 and then using code units from 1024 to 2047.
+main() {
+  const int maxStringLength = 128;
+  // A single generator with a fixed seed keeps the generated inputs, and
+  // therefore any failure, reproducible from run to run.
+  final random = Random(42);
+  // OneByteString
+  for (int i = 0; i < maxStringLength; i++) {
+    final l = List.generate(i, (n) => random.nextInt(30) + 40);
+    compare(l, 'a', 'b', false);
+    compare(l, 'a', 'a', true);
+  }
+  // TwoByteString
+  for (int i = 0; i < maxStringLength; i++) {
+    final l = List.generate(i, (n) => random.nextInt(1024) + 1024);
+    compare(l, String.fromCharCodes(<int>[1042]),
+        String.fromCharCodes(<int>[1043]), false);
+    compare(l, String.fromCharCodes(<int>[1042]),
+        String.fromCharCodes(<int>[1042]), true);
+  }
+}
@@ -0,0 +1,46 @@
+// Copyright (c) 2022, the Dart project authors.  Please see the AUTHORS file
+// for details. All rights reserved. Use of this source code is governed by a
+// BSD-style license that can be found in the LICENSE file.
+//
+// @dart = 2.9
+//
+// Verifies that the string equality implementation correctly handles strings
+// of various lengths.
+
+import 'dart:math';
+
+import "package:expect/expect.dart";
+
+/// Checks that `==` on strings built around [s_piece] and [t_piece] yields
+/// [expectedEquality].
+///
+/// [ints] is converted to a string `s` that serves as shared padding. The
+/// pieces are compared in the middle (`s + piece + s`), at the tail
+/// (`s + piece`) and at the head (`piece + s`) of otherwise equal strings.
+/// Every pair is also expected to be two distinct objects, so the comparison
+/// cannot be satisfied by an identity check alone.
+compare(List<int> ints, String s_piece, String t_piece, bool expectedEquality) {
+  final s = String.fromCharCodes(ints);
+  // Note: Expect.equals takes the expected value first, then the actual one.
+  String s_mid = s + s_piece + s;
+  String t_mid = s + t_piece + s;
+  Expect.isFalse(identical(s_mid, t_mid));
+  Expect.equals(expectedEquality, s_mid == t_mid);
+  String s_tail = s + s_piece;
+  String t_tail = s + t_piece;
+  Expect.isFalse(identical(s_tail, t_tail));
+  Expect.equals(expectedEquality, s_tail == t_tail);
+  String s_head = s_piece + s;
+  String t_head = t_piece + s;
+  Expect.isFalse(identical(s_head, t_head));
+  Expect.equals(expectedEquality, s_head == t_head);
+}
+
+/// Runs [compare] with padding of every length below 128, first using code
+/// units from 40 to 69 and then using code units from 1024 to 2047.
+main() {
+  const int maxStringLength = 128;
+  // A single generator with a fixed seed keeps the generated inputs, and
+  // therefore any failure, reproducible from run to run.
+  final random = Random(42);
+  // OneByteString
+  for (int i = 0; i < maxStringLength; i++) {
+    final l = List.generate(i, (n) => random.nextInt(30) + 40);
+    compare(l, 'a', 'b', false);
+    compare(l, 'a', 'a', true);
+  }
+  // TwoByteString
+  for (int i = 0; i < maxStringLength; i++) {
+    final l = List.generate(i, (n) => random.nextInt(1024) + 1024);
+    compare(l, String.fromCharCodes(<int>[1042]),
+        String.fromCharCodes(<int>[1043]), false);
+    compare(l, String.fromCharCodes(<int>[1042]),
+        String.fromCharCodes(<int>[1042]), true);
+  }
+}
@@ -5977,16 +5977,41 @@ class StringDeserializationCluster
       const intptr_t encoded = d.ReadUnsigned();
       intptr_t cid = 0;
       const intptr_t length = DecodeLengthAndCid(encoded, &cid);
-      Deserializer::InitializeHeader(str, cid, InstanceSize(length, cid),
+      const intptr_t instance_size = InstanceSize(length, cid);
+      // Clean up last two words of the string object to simplify future
+      // string comparisons.
+      // Objects are rounded up to two-word size boundary.
+      *reinterpret_cast<word*>(reinterpret_cast<uint8_t*>(str->untag()) +
+                               instance_size - 1 * kWordSize) = 0;
+      *reinterpret_cast<word*>(reinterpret_cast<uint8_t*>(str->untag()) +
+                               instance_size - 2 * kWordSize) = 0;
+      Deserializer::InitializeHeader(str, cid, instance_size,
                                      primary && is_canonical());
+#if DART_COMPRESSED_POINTERS
+      // Gap caused by less-than-a-word length_ smi sitting before data_.
+      const intptr_t length_offset =
+          reinterpret_cast<intptr_t>(&str->untag()->length_);
+      const intptr_t data_offset =
+          cid == kOneByteStringCid
+              ? reinterpret_cast<intptr_t>(
+                    static_cast<OneByteStringPtr>(str)->untag()->data())
+              : reinterpret_cast<intptr_t>(
+                    static_cast<TwoByteStringPtr>(str)->untag()->data());
+      const intptr_t length_with_gap = data_offset - length_offset;
+      ASSERT(length_with_gap > kCompressedWordSize);
+      ASSERT(length_with_gap == kWordSize);
+      memset(reinterpret_cast<void*>(length_offset), 0, length_with_gap);
+#endif
       str->untag()->length_ = Smi::New(length);
+
       StringHasher hasher;
       if (cid == kOneByteStringCid) {
         for (intptr_t j = 0; j < length; j++) {
           uint8_t code_unit = d.Read<uint8_t>();
           static_cast<OneByteStringPtr>(str)->untag()->data()[j] = code_unit;
           hasher.Add(code_unit);
         }
+
       } else {
         for (intptr_t j = 0; j < length; j++) {
           uint16_t code_unit = d.Read<uint8_t>();
 
@@ -1572,6 +1572,12 @@ static void TryAllocateString(Assembler* assembler,
   // next object start and initialize the object.
   __ str(R1, Address(THR, target::Thread::top_offset()));
   __ AddImmediate(R0, kHeapObjectTag);
+  // Zero the last two words of the object so that string comparison can
+  // compare whole words without special handling for strings whose data
+  // does not end on a word boundary.
+  __ LoadImmediate(TMP, 0);
+  __ str(TMP, Address(R1, -1 * target::kWordSize));
+  __ str(TMP, Address(R1, -2 * target::kWordSize));
 
   // Initialize the tags.
   // R0: new object start as a tagged pointer.
@@ -1726,7 +1732,7 @@ static void StringEquality(Assembler* assembler,
   __ cmp(R0, Operand(R1));
   __ b(&is_true, EQ);
 
-  // Is other OneByteString?
+  // Is other same kind of string?
   __ tst(R1, Operand(kSmiTagMask));
   __ b(normal_ir_body, EQ);
   __ CompareClassId(R1, string_cid, R2);
@@ -1742,29 +1748,30 @@ static void StringEquality(Assembler* assembler,
   // TODO(zra): try out other sequences.
   ASSERT((string_cid == kOneByteStringCid) ||
          (string_cid == kTwoByteStringCid));
-  const intptr_t offset = (string_cid == kOneByteStringCid)
-                              ? target::OneByteString::data_offset()
-                              : target::TwoByteString::data_offset();
-  __ AddImmediate(R0, offset - kHeapObjectTag);
-  __ AddImmediate(R1, offset - kHeapObjectTag);
-  __ SmiUntag(R2);
+  if (string_cid == kOneByteStringCid) {
+    __ SmiUntag(R2);
+  }
+  // R2 is length of data in bytes.
+  // Round up number of bytes to compare to word boundary since we
+  // are doing comparison in word chunks.
+  __ AddImmediate(R2, target::kWordSize - 1);
+  __ LsrImmediate(R2, R2, target::kWordSizeLog2);
+  ASSERT(target::OneByteString::data_offset() ==
+         target::String::length_offset() + target::kWordSize);
+  ASSERT(target::TwoByteString::data_offset() ==
+         target::String::length_offset() + target::kWordSize);
+  COMPILE_ASSERT(target::kWordSize == 4);
+  __ AddImmediate(
+      R0, target::String::length_offset() + target::kWordSize - kHeapObjectTag);
+  __ AddImmediate(
+      R1, target::String::length_offset() + target::kWordSize - kHeapObjectTag);
+
   __ Bind(&loop);
   __ AddImmediate(R2, -1);
   __ cmp(R2, Operand(0));
   __ b(&is_true, LT);
-  if (string_cid == kOneByteStringCid) {
-    __ ldrb(R3, Address(R0));
-    __ ldrb(R4, Address(R1));
-    __ AddImmediate(R0, 1);
-    __ AddImmediate(R1, 1);
-  } else if (string_cid == kTwoByteStringCid) {
-    __ ldrh(R3, Address(R0));
-    __ ldrh(R4, Address(R1));
-    __ AddImmediate(R0, 2);
-    __ AddImmediate(R1, 2);
-  } else {
-    UNIMPLEMENTED();
-  }
+  __ ldr(R3, Address(R0, 4, Address::PostIndex));
+  __ ldr(R4, Address(R1, 4, Address::PostIndex));
   __ cmp(R3, Operand(R4));
   __ b(&is_false, NE);
   __ b(&loop);
 
@@ -1789,6 +1789,10 @@ static void TryAllocateString(Assembler* assembler,
   // next object start and initialize the object.
   __ str(R1, Address(THR, target::Thread::top_offset()));
   __ AddImmediate(R0, kHeapObjectTag);
+  // Zero the last two words of the object so that string comparison can
+  // compare whole words without special handling for strings whose data
+  // does not end on a word boundary.
+  __ stp(ZR, ZR, Address(R1, -2 * target::kWordSize, Address::PairOffset));
 
   // Initialize the tags.
   // R0: new object start as a tagged pointer.
@@ -1812,6 +1816,10 @@ static void TryAllocateString(Assembler* assembler,
     __ str(R2, FieldAddress(R0, target::Object::tags_offset()));  // Store tags.
   }
 
+#if DART_COMPRESSED_POINTERS
+  // Clear out padding caused by alignment gap between length and data.
+  __ str(ZR, FieldAddress(R0, target::String::length_offset()));
+#endif
   // Set the length field using the saved length (R6).
   __ StoreCompressedIntoObjectNoBarrier(
       R0, FieldAddress(R0, target::String::length_offset()), R6);
@@ -1953,44 +1961,43 @@ static void StringEquality(Assembler* assembler,
   __ CompareObjectRegisters(R0, R1);
   __ b(&is_true, EQ);
 
-  // Is other OneByteString?
+  // Is other same kind of string?
   __ BranchIfSmi(R1, normal_ir_body);
   __ CompareClassId(R1, string_cid);
   __ b(normal_ir_body, NE);
 
   // Have same length?
-  __ LoadCompressedSmi(R2, FieldAddress(R0, target::String::length_offset()));
-  __ LoadCompressedSmi(R3, FieldAddress(R1, target::String::length_offset()));
-  __ CompareObjectRegisters(R2, R3);
+  __ ldr(R2, FieldAddress(R0, target::String::length_offset()));
+  __ ldr(R3, FieldAddress(R1, target::String::length_offset()));
+  __ CompareRegisters(R2, R3);
   __ b(&is_false, NE);
 
-  // Check contents, no fall-through possible.
-  // TODO(zra): try out other sequences.
   ASSERT((string_cid == kOneByteStringCid) ||
          (string_cid == kTwoByteStringCid));
-  const intptr_t offset = (string_cid == kOneByteStringCid)
-                              ? target::OneByteString::data_offset()
-                              : target::TwoByteString::data_offset();
-  __ AddImmediate(R0, offset - kHeapObjectTag);
-  __ AddImmediate(R1, offset - kHeapObjectTag);
-  __ SmiUntag(R2);
+  if (string_cid == kOneByteStringCid) {
+    __ SmiUntag(R2);
+  }
+  // R2 is length of data in bytes.
+  // Round up number of bytes to compare to word boundary since we
+  // are doing comparison in word chunks.
+  __ AddImmediate(R2, target::kWordSize - 1);
+  __ LsrImmediate(R2, R2, target::kWordSizeLog2);
+  ASSERT(target::OneByteString::data_offset() ==
+         target::String::length_offset() + target::kWordSize);
+  ASSERT(target::TwoByteString::data_offset() ==
+         target::String::length_offset() + target::kWordSize);
+  COMPILE_ASSERT(target::kWordSize == 8);
+  __ AddImmediate(
+      R0, target::String::length_offset() + target::kWordSize - kHeapObjectTag);
+  __ AddImmediate(
+      R1, target::String::length_offset() + target::kWordSize - kHeapObjectTag);
+
   __ Bind(&loop);
   __ AddImmediate(R2, -1);
   __ CompareRegisters(R2, ZR);
   __ b(&is_true, LT);
-  if (string_cid == kOneByteStringCid) {
-    __ ldr(R3, Address(R0), kUnsignedByte);
-    __ ldr(R4, Address(R1), kUnsignedByte);
-    __ AddImmediate(R0, 1);
-    __ AddImmediate(R1, 1);
-  } else if (string_cid == kTwoByteStringCid) {
-    __ ldr(R3, Address(R0), kUnsignedTwoBytes);
-    __ ldr(R4, Address(R1), kUnsignedTwoBytes);
-    __ AddImmediate(R0, 2);
-    __ AddImmediate(R1, 2);
-  } else {
-    UNIMPLEMENTED();
-  }
+  __ ldr(R3, Address(R0, 8, Address::PostIndex));
+  __ ldr(R4, Address(R1, 8, Address::PostIndex));
   __ cmp(R3, Operand(R4));
   __ b(&is_false, NE);
   __ b(&loop);
 
@@ -1627,7 +1627,12 @@ static void TryAllocateString(Assembler* assembler,
   // next object start and initialize the object.
   __ movl(Address(THR, target::Thread::top_offset()), EBX);
   __ addl(EAX, Immediate(kHeapObjectTag));
-
+  // Zero the last two words of the object so that string comparison can
+  // compare whole words without special handling for strings whose data
+  // does not end on a word boundary.
+  ASSERT(target::kWordSize == 4);
+  __ movl(Address(EBX, -1 * target::kWordSize), Immediate(0));
+  __ movl(Address(EBX, -2 * target::kWordSize), Immediate(0));
   // Initialize the tags.
   // EAX: new object start as a tagged pointer.
   // EBX: new object end address.
@@ -1777,7 +1782,7 @@ static void StringEquality(Assembler* assembler,
   __ cmpl(EAX, EBX);
   __ j(EQUAL, &is_true, Assembler::kNearJump);
 
-  // Is other OneByteString?
+  // Is other same kind of string?
   __ testl(EBX, Immediate(kSmiTagMask));
   __ j(ZERO, &is_false);  // Smi
   __ CompareClassId(EBX, string_cid, EDI);
@@ -1788,27 +1793,28 @@ static void StringEquality(Assembler* assembler,
   __ cmpl(EDI, FieldAddress(EBX, target::String::length_offset()));
   __ j(NOT_EQUAL, &is_false, Assembler::kNearJump);
 
-  // Check contents, no fall-through possible.
-  // TODO(srdjan): write a faster check.
-  __ SmiUntag(EDI);
+  if (string_cid == kOneByteStringCid) {
+    __ SmiUntag(EDI);
+  }
+
+  // Round up number of bytes to compare to word boundary since we
+  // are doing comparison in word chunks.
+  __ addl(EDI, Immediate(target::kWordSize - 1));
+  __ sarl(EDI, Immediate(target::kWordSizeLog2));
   __ Bind(&loop);
   __ decl(EDI);
-  __ cmpl(EDI, Immediate(0));
   __ j(LESS, &is_true, Assembler::kNearJump);
-  if (string_cid == kOneByteStringCid) {
-    __ movzxb(ECX, FieldAddress(EAX, EDI, TIMES_1,
-                                target::OneByteString::data_offset()));
-    __ movzxb(EDX, FieldAddress(EBX, EDI, TIMES_1,
-                                target::OneByteString::data_offset()));
-  } else if (string_cid == kTwoByteStringCid) {
-    __ movzxw(ECX, FieldAddress(EAX, EDI, TIMES_2,
-                                target::TwoByteString::data_offset()));
-    __ movzxw(EDX, FieldAddress(EBX, EDI, TIMES_2,
-                                target::TwoByteString::data_offset()));
-  } else {
-    UNIMPLEMENTED();
-  }
-  __ cmpl(ECX, EDX);
+  ASSERT(target::OneByteString::data_offset() ==
+         target::String::length_offset() + target::kWordSize);
+  ASSERT(target::TwoByteString::data_offset() ==
+         target::String::length_offset() + target::kWordSize);
+  COMPILE_ASSERT(target::kWordSize == 4);
+  __ movl(ECX, FieldAddress(EAX, EDI, TIMES_4,
+                            target::String::length_offset() +
+                                target::kWordSize));  // word with length itself
+  __ cmpl(ECX, FieldAddress(EBX, EDI, TIMES_4,
+                            target::String::length_offset() +
+                                target::kWordSize));  // word with length itself
   __ j(NOT_EQUAL, &is_false, Assembler::kNearJump);
   __ jmp(&loop, Assembler::kNearJump);