tokio-rs · danburkert · Jun 11, 2019 · Jun 9, 2019 · Jun 9, 2019 · Jun 10, 2019
diff --git a/src/encoding.rs b/src/encoding.rs
@@ -716,6 +716,44 @@ macro_rules! length_delimited {
 pub mod string {
     use super::*;
 
+    // Guard for writing raw bytes into a `String` through `String::as_mut_vec`,
+    // which is unsafe because it doesn't check that the inserted bytes are valid
+    // UTF-8. `commit` performs that check once the buffer is fully extended.
+    // If the guard is dropped before a successful `commit` (early return or
+    // unwind), the string is truncated back to the previously valid length.
+    struct StringGuard<'a> {
+        string: &'a mut String, // string being written; may hold unvalidated bytes past `committed_len`
+        committed_len: usize, // length the string is cut back to when the guard is dropped
+    }
+
+    impl<'a> Drop for StringGuard<'a> {
+        /// Rolls the guarded string back to its last committed length.
+        ///
+        /// After a successful `commit` the committed length equals the full
+        /// length, so this is a no-op; otherwise every byte written since the
+        /// guard was created is discarded.
+        fn drop(&mut self) {
+            // Bytes past `committed_len` may not be valid UTF-8 at this point.
+            // `String::truncate` asserts that the cut lands on a char boundary
+            // by inspecting the byte at that index, so an appended continuation
+            // byte (0x80..=0xBF) right after a non-empty prefix would make the
+            // rollback itself panic -- possibly while already unwinding.
+            // Truncating the underlying byte vector never inspects the bytes.
+            //
+            // SAFETY: the first `committed_len` bytes were valid UTF-8 when the
+            // guard was created (or were validated by `commit`), so cutting the
+            // vector there leaves a valid `String`.
+            // NOTE(review): this assumes writes made through the guard only
+            // append and never modify the committed prefix -- confirm against
+            // `bytes::merge`.
+            unsafe {
+                self.string.as_mut_vec().truncate(self.committed_len);
+            }
+        }
+    }
+
+    impl<'a> StringGuard<'a> {
+        /// Wraps `string`, recording its current length as the rollback point.
+        fn new(string: &'a mut String) -> Self {
+            StringGuard {
+                committed_len: string.len(),
+                string,
+            }
+        }
+
+        /// Exposes the guarded string's underlying byte vector for writing.
+        ///
+        /// # Safety
+        ///
+        /// Same contract as `String::as_mut_vec`: the bytes written are not
+        /// checked here. The caller must either let `commit` validate them or
+        /// let the guard drop so the string is cut back to the committed length.
+        unsafe fn as_mut_vec(&mut self) -> &mut Vec<u8> {
+            self.string.as_mut_vec()
+        }
+
+        /// Validates everything written since the last committed length and,
+        /// on success, keeps it.
+        ///
+        /// Returns a `DecodeError` when the new bytes are not valid UTF-8; the
+        /// guard is then dropped with its committed length unchanged, which
+        /// discards those bytes.
+        fn commit(mut self) -> Result<(), DecodeError> {
+            let total_len = self.string.len();
+            let appended = &self.string.as_bytes()[self.committed_len..];
+            if str::from_utf8(appended).is_err() {
+                return Err(DecodeError::new(
+                    "invalid string value: data is not UTF-8 encoded",
+                ));
+            }
+            // Moving the rollback point to the end turns the truncation that
+            // runs when `self` is dropped into a no-op.
+            self.committed_len = total_len;
+            Ok(())
+        }
+    }
+
     pub fn encode<B>(tag: u32, value: &String, buf: &mut B)
     where
         B: BufMut,
@@ -728,14 +766,11 @@ pub mod string {
     where
         B: Buf,
     {
+        let mut guard = StringGuard::new(value);
         unsafe {
-            // String::as_mut_vec is unsafe because it doesn't check that the bytes
-            // inserted into it the resulting vec are valid UTF-8. We check
-            // explicitly in order to ensure this is safe.
-            super::bytes::merge(wire_type, value.as_mut_vec(), buf)?;
-            str::from_utf8(value.as_bytes())
-                .map_err(|_| DecodeError::new("invalid string value: data is not UTF-8 encoded"))?;
+            super::bytes::merge(wire_type, guard.as_mut_vec(), buf)?;
         }
+        guard.commit()?;
         Ok(())
     }
 
@@ -1307,6 +1342,15 @@ mod test {
         }
     }
 
+    /// Merging a length-delimited payload that is not valid UTF-8 must fail
+    /// and leave the destination string untouched.
+    #[test]
+    fn string_merge_failure() {
+        let mut s = String::new();
+        // Length prefix 2 followed by two bare continuation bytes. Without the
+        // prefix, `\x80\x80` is an unterminated varint, so decoding would fail
+        // on the length itself and never reach the UTF-8 check.
+        let mut buf = Cursor::new(b"\x02\x80\x80");
+        let r = string::merge(WireType::LengthDelimited, &mut s, &mut buf);
+        r.expect_err("must be an error");
+        assert!(s.is_empty());
+    }
+
     #[test]
     fn varint() {
         fn check(value: u64, encoded: &[u8]) {