apache · srowen · Jun 16, 2019 · Jun 16, 2019 · Jun 17, 2019 · MaxGekk
diff --git a/common/unsafe/src/main/java/org/apache/spark/unsafe/types/UTF8String.java b/common/unsafe/src/main/java/org/apache/spark/unsafe/types/UTF8String.java
@@ -534,12 +534,16 @@ public UTF8String trim() {
     // skip all of the space (0x20) in the left side
     while (s < this.numBytes && getByte(s) == 0x20) s++;
     if (s == this.numBytes) {
-      // empty string
+      // Everything trimmed
       return EMPTY_UTF8;
     }
     // skip all of the space (0x20) in the right side
     int e = this.numBytes - 1;
     while (e > s && getByte(e) == 0x20) e--;
+    if (s == 0 && e == numBytes - 1) {
+      // Nothing trimmed
+      return this;
+    }
     return copyUTF8String(s, e);
   }
 
@@ -562,12 +566,15 @@ public UTF8String trimLeft() {
     int s = 0;
     // skip all of the space (0x20) in the left side
     while (s < this.numBytes && getByte(s) == 0x20) s++;
+    if (s == 0) {
+      // Nothing trimmed
+      return this;
+    }
     if (s == this.numBytes) {
-      // empty string
+      // Everything trimmed
       return EMPTY_UTF8;
-    } else {
-      return copyUTF8String(s, this.numBytes - 1);
     }
+    return copyUTF8String(s, this.numBytes - 1);
   }
 
   /**
@@ -597,26 +604,30 @@ public UTF8String trimLeft(UTF8String trimString) {
       }
       srchIdx += searchCharBytes;
     }
-
+    if (srchIdx == 0) {
+      // Nothing trimmed
+      return this;
+    }
     if (trimIdx >= numBytes) {
-      // empty string
+      // Everything trimmed
       return EMPTY_UTF8;
-    } else {
-      return copyUTF8String(trimIdx, numBytes - 1);
     }
+    return copyUTF8String(trimIdx, numBytes - 1);
   }
 
   public UTF8String trimRight() {
     int e = numBytes - 1;
     // skip all of the space (0x20) in the right side
     while (e >= 0 && getByte(e) == 0x20) e--;
-
+    if (e == numBytes - 1) {
+      // Nothing trimmed: return this instance rather than calling copyUTF8String
+      return this;
+    }
     if (e < 0) {
-      // empty string
+      // Everything trimmed: every byte was a space (0x20)
       return EMPTY_UTF8;
-    } else {
-      return copyUTF8String(0, e);
     }
+    return copyUTF8String(0, e);
   }
 
   /**
@@ -658,12 +669,15 @@ public UTF8String trimRight(UTF8String trimString) {
       numChars --;
     }
 
+    if (trimEnd == numBytes - 1) {
+      // Nothing trimmed
+      return this;
+    }
     if (trimEnd < 0) {
-      // empty string
+      // Everything trimmed
       return EMPTY_UTF8;
-    } else {
-      return copyUTF8String(0, trimEnd);
     }
+    return copyUTF8String(0, trimEnd);
   }
 
   public UTF8String reverse() {