summaryrefslogtreecommitdiffstats
blob: 17d49c273d5bb40cfdc8d84cb98585d906b18900 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
/*
 * Copyright (c) 2010 Remko Tronçon
 * Licensed under the GNU General Public License v3.
 * See Documentation/Licenses/GPLv3.txt for more information.
 */

#include <cassert>
#include <algorithm>

#include "Swiften/Base/String.h"

namespace Swift {

static inline size_t sequenceLength(char firstByte) {
	if ((firstByte & 0x80) == 0) {
		return 1;
	}
	if ((firstByte & 0xE0) == 0xC0) {
		return 2;
	}
	if ((firstByte & 0xF0) == 0xE0) {
		return 3;
	}
	if ((firstByte & 0xF8) == 0xF0) {
		return 4;
	}
	if ((firstByte & 0xFC) == 0xF8) {
		return 5;
	}
	if ((firstByte & 0xFE) == 0xFC) {
		return 6;
	}
	assert(false);
	return 1;
}

std::vector<unsigned int> String::getUnicodeCodePoints() const {
	std::vector<unsigned int> result;
	for (size_t i = 0; i < data_.size();) {
		unsigned int codePoint = 0;
		char firstChar = data_[i];
		size_t length = sequenceLength(firstChar);

		// First character is special
		size_t firstCharBitSize = 7 - length;
		if (length == 1) {
			firstCharBitSize = 7;
		}
		codePoint = firstChar & ((1<<(firstCharBitSize+1)) - 1);

		for (size_t j = 1; j < length; ++j) {
			codePoint = (codePoint<<6) | (data_[i+j] & 0x3F);
		}
		result.push_back(codePoint);
		i += length;
	}
	return result;
}


std::pair<String,String> String::getSplittedAtFirst(char c) const {
	assert((c & 0x80) == 0);
	size_t firstMatch = data_.find(c);
	if (firstMatch != data_.npos) {
		return std::make_pair(data_.substr(0,firstMatch),data_.substr(firstMatch+1,data_.npos));
	}
	else {
		return std::make_pair(*this, "");
	}
}

size_t String::getLength() const {
	size_t size = 0, current = 0, end = data_.size();
	while (current < end) {
		size++;
		current += sequenceLength(data_[current]);
	}
	return size;
}

void String::removeAll(char c) {
	size_t lastPos = 0;
	size_t matchingIndex = 0;
	while ((matchingIndex = data_.find(c, lastPos)) != data_.npos) {
		data_.erase(matchingIndex, 1);
		lastPos = matchingIndex;
	}
}

void String::replaceAll(char c, const String& s) {
	size_t lastPos = 0;
	size_t matchingIndex = 0;
	while ((matchingIndex = data_.find(c, lastPos)) != data_.npos) {
		data_.replace(matchingIndex, 1, s.data_);
		lastPos = matchingIndex + s.data_.size();
	}
}

std::vector<String> String::split(char c) const {
	assert((c & 0x80) == 0);
	std::vector<String> result;
	String accumulator;
	for (size_t i = 0; i < data_.size(); ++i) {
		if (data_[i] == c) {
			result.push_back(accumulator);
			accumulator = "";
		}
		else {
			accumulator += data_[i];
		}
	}
	result.push_back(accumulator);
	return result;
}

}