Add UTF-8 validation function and validate input to libIDN functions

This is required to protect against the CVE-2015-2059 vulnerability in libIDN. Test-Information: Added unit tests for UTF-8 validation and tested that existing unit tests still pass. Change-Id: I0a94136894c6e0004081456c59155a78a3dabf5f
author: Tobias Markmann <tm@ayena.de> 2015-09-17 08:14:57 (GMT)
committer: Swift Review <review@swift.im> 2015-10-16 10:38:19 (GMT)
commit: 3a2b966711dbe6fa937c485d7ad56916219badb2 (patch)
tree: 30e9f30bc3f2a3ca6b4ed0c5c11f4ae0703485d0 /Swiften/IDN/UTF8Validator.h
parent: 582ca915b5b82ada46d1183a7b882455ee01b7b1 (diff)
download: swift-3a2b966711dbe6fa937c485d7ad56916219badb2.zip
swift-3a2b966711dbe6fa937c485d7ad56916219badb2.tar.bz2
1 file changed, 67 insertions, 0 deletions
diff --git a/Swiften/IDN/UTF8Validator.h b/Swiften/IDN/UTF8Validator.h
new file mode 100644
index 0000000..5df8769
--- /dev/null
+++ b/Swiften/IDN/UTF8Validator.h
@@ -0,0 +1,67 @@
+/*
+ * Copyright (c) 2015 Isode Limited.
+ * All rights reserved.
+ * See the COPYING file for more information.
+ */
+
+#pragma once
+
+#include <cstddef>
+
+namespace Swift {
+
+/**
+ * Checks whether [data, data + length) is well-formed UTF-8 according to the
+ * UTF8-octets grammar in https://tools.ietf.org/html/rfc3629#section-4 .
+ * Truncated sequences, stray continuation bytes, overlong encodings, UTF-16
+ * surrogates (U+D800..U+DFFF) and code points above U+10FFFF are all rejected.
+ *
+ * @param data First code unit of the input; only the low 8 bits of each unit are inspected.
+ * @param length Number of code units readable at data.
+ * @return true if the whole range is valid UTF-8; an empty range is valid.
+ */
+template <typename CharType>
+bool UTF8IsValid(const CharType* data, size_t length) {
+	const CharType* current = data;
+	const CharType* end = data + length;
+	while (current < end) {
+		// Mask to one byte so signed char and wider unit types are classified alike.
+		const int lead = static_cast<int>(*current & 0xFF);
+		++current;
+		if (lead < 0x80) {
+			continue; // one byte sequence (ASCII)
+		}
+		// Allowed range of the next continuation byte. The first one is narrowed for
+		// some lead bytes to exclude overlong forms, surrogates and values > U+10FFFF.
+		int low = 0x80;
+		int high = 0xBF;
+		int trailing = 0;
+		if (lead >= 0xC2 && lead <= 0xDF) { // two byte sequences; C0 and C1 are always overlong
+			trailing = 1;
+		}
+		else if (lead >= 0xE0 && lead <= 0xEF) { // three byte sequences
+			trailing = 2;
+			if (lead == 0xE0) { low = 0xA0; } // E0 80..9F is overlong
+			if (lead == 0xED) { high = 0x9F; } // ED A0..BF are surrogates
+		}
+		else if (lead >= 0xF0 && lead <= 0xF4) { // four byte sequences
+			trailing = 3;
+			if (lead == 0xF0) { low = 0x90; } // F0 80..8F is overlong
+			if (lead == 0xF4) { high = 0x8F; } // F4 90..BF exceeds U+10FFFF
+		}
+		else {
+			return false; // stray continuation byte, C0/C1, or lead byte F5..FF
+		}
+		for (; trailing > 0; --trailing, ++current) {
+			// Fails on truncated input or a continuation byte outside [low, high].
+			if (current == end || (*current & 0xFF) < low || (*current & 0xFF) > high) {
+				return false;
+			}
+			low = 0x80;
+			high = 0xBF;
+		}
+	}
+	return true;
+}
+
+}
author	Tobias Markmann <tm@ayena.de>	2015-09-17 08:14:57 (GMT)
committer	Swift Review <review@swift.im>	2015-10-16 10:38:19 (GMT)
commit	3a2b966711dbe6fa937c485d7ad56916219badb2 (patch)
tree	30e9f30bc3f2a3ca6b4ed0c5c11f4ae0703485d0 /Swiften/IDN/UTF8Validator.h
parent	582ca915b5b82ada46d1183a7b882455ee01b7b1 (diff)
download	swift-3a2b966711dbe6fa937c485d7ad56916219badb2.zip swift-3a2b966711dbe6fa937c485d7ad56916219badb2.tar.bz2