/* ScummVM - Graphic Adventure Engine * * ScummVM is the legal property of its developers, whose names * are too numerous to list here. Please refer to the COPYRIGHT * file distributed with this source distribution. * * This program is free software; you can redistribute it and/or * modify it under the terms of the GNU General Public License * as published by the Free Software Foundation; either version 2 * of the License, or (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. * * $URL$ * $Id$ */ #ifndef COMMON_STRING_H #define COMMON_STRING_H #include "common/scummsys.h" namespace Common { /** * Simple string class for ScummVM. Provides automatic storage managment, * and overloads several operators in a 'natural' fashion, mimicking * the std::string class. Even provides simple iterators. * * This class tries to avoid allocating lots of small blocks on the heap, * since that is inefficient on several platforms supported by ScummVM. * Instead, small strings are stored 'inside' the string object (i.e. on * the stack, for stack allocated objects), and only for strings exceeding * a certain length do we allocate a buffer on the heap. */ class String { protected: /** * The size of the internal storage. Increasing this means less heap * allocations are needed, at the cost of more stack memory usage, * and of course lots of wasted memory. Empirically, 90% or more of * all String instances are less than 32 chars long. If a platform * is very short on stack space, it would be possible to lower this. * A value of 24 still seems acceptable, though considerably worse, * while 16 seems to be the lowest you want to go... Anything lower * than 8 makes no sense, since that's the size of member _extern * (on 32 bit machines; 12 bytes on systems with 64bit pointers). */ static const uint32 _builtinCapacity = 32 - sizeof(uint32) - sizeof(char *); /** * Length of the string. Stored to avoid having to call strlen * a lot. Yes, we limit ourselves to strings shorter than 4GB -- * on purpose :-). */ uint32 _size; /** * Pointer to the actual string storage. Either points to _storage, * or to a block allocated on the heap via malloc. */ char *_str; union { /** * Internal string storage. */ char _storage[_builtinCapacity]; /** * External string storage data -- the refcounter, and the * capacity of the string _str points to. */ struct { mutable int *_refCount; uint32 _capacity; } _extern; }; inline bool isStorageIntern() const { return _str == _storage; } public: /** Construct a new empty string. */ String() : _size(0), _str(_storage) { _storage[0] = 0; } /** Construct a new string from the given NULL-terminated C string. */ String(const char *str); /** Construct a new string containing exactly len characters read from address str. */ String(const char *str, uint32 len); /** Construct a new string containing the characters between beginP (including) and endP (excluding). */ String(const char *beginP, const char *endP); /** Construct a copy of the given string. */ String(const String &str); /** Construct a string consisting of the given character. */ explicit String(char c); ~String(); String &operator=(const char *str); String &operator=(const String &str); String &operator=(char c); String &operator+=(const char *str); String &operator+=(const String &str); String &operator+=(char c); bool operator==(const String &x) const; bool operator==(const char *x) const; bool operator!=(const String &x) const; bool operator!=(const char *x) const; bool operator<(const String &x) const; bool operator<=(const String &x) const; bool operator>(const String &x) const; bool operator>=(const String &x) const; bool equals(const String &x) const; bool equalsIgnoreCase(const String &x) const; int compareTo(const String &x) const; // strcmp clone int compareToIgnoreCase(const String &x) const; // stricmp clone bool equals(const char *x) const; bool equalsIgnoreCase(const char *x) const; int compareTo(const char *x) const; // strcmp clone int compareToIgnoreCase(const char *x) const; // stricmp clone bool hasSuffix(const String &x) const; bool hasSuffix(const char *x) const; bool hasPrefix(const String &x) const; bool hasPrefix(const char *x) const; bool contains(const String &x) const; bool contains(const char *x) const; bool contains(char x) const; /** * Simple DOS-style pattern matching function (understands * and ? like used in DOS). * Taken from exult/files/listfiles.cc * * Token meaning: * "*": any character, any amount of times. * "?": any character, only once. * * Example strings/patterns: * String: monkey.s01 Pattern: monkey.s?? => true * String: monkey.s101 Pattern: monkey.s?? => false * String: monkey.s99 Pattern: monkey.s?1 => false * String: monkey.s101 Pattern: monkey.s* => true * String: monkey.s99 Pattern: monkey.s*1 => false * * @param str Text to be matched against the given pattern. * @param pat Glob pattern. * @param ignoreCase Whether to ignore the case when doing pattern match * @param pathMode Whether to use path mode, i.e., whether slashes must be matched explicitly. * * @return true if str matches the pattern, false otherwise. */ bool matchString(const char *pat, bool ignoreCase = false, bool pathMode = false) const; bool matchString(const String &pat, bool ignoreCase = false, bool pathMode = false) const; inline const char *c_str() const { return _str; } inline uint size() const { return _size; } inline bool empty() const { return (_size == 0); } char lastChar() const { return (_size > 0) ? _str[_size - 1] : 0; } char operator[](int idx) const { assert(_str && idx >= 0 && idx < (int)_size); return _str[idx]; } /** Remove the last character from the string. */ void deleteLastChar(); /** Remove the character at position p from the string. */ void deleteChar(uint32 p); /** Set character c at position p, replacing the previous character there. */ void setChar(char c, uint32 p); /** Insert character c before position p. */ void insertChar(char c, uint32 p); /** Clears the string, making it empty. */ void clear(); /** Convert all characters in the string to lowercase. */ void toLowercase(); /** Convert all characters in the string to uppercase. */ void toUppercase(); /** * Removes trailing and leading whitespaces. Uses isspace() to decide * what is whitespace and what not. */ void trim(); uint hash() const; /** * Printf-like function. Returns a formatted String. */ static Common::String printf(const char *fmt, ...) GCC_PRINTF(1,2); public: typedef char * iterator; typedef const char * const_iterator; iterator begin() { return _str; } iterator end() { return begin() + size(); } const_iterator begin() const { return _str; } const_iterator end() const { return begin() + size(); } protected: void makeUnique(); void ensureCapacity(uint32 new_size, bool keep_old); void incRefCount() const; void decRefCount(int *oldRefCount); void initWithCStr(const char *str, uint32 len); }; // Append two strings to form a new (temp) string String operator+(const String &x, const String &y); String operator+(const char *x, const String &y); String operator+(const String &x, const char *y); String operator+(const String &x, char y); String operator+(char x, const String &y); // Some useful additional comparison operators for Strings bool operator==(const char *x, const String &y); bool operator!=(const char *x, const String &y); // Utility functions to remove leading and trailing whitespaces extern char *ltrim(char *t); extern char *rtrim(char *t); extern char *trim(char *t); /** * Returns the last component of a given path. * * Examples: * /foo/bar.txt would return 'bar.txt' * /foo/bar/ would return 'bar' * /foo/./bar// would return 'bar' * * @param path the path of which we want to know the last component * @param sep character used to separate path components * @return The last component of the path. */ Common::String lastPathComponent(const Common::String &path, const char sep); /** * Normalize a gien path to a canonical form. In particular: * - trailing separators are removed: /foo/bar/ -> /foo/bar * - double separators (= empty components) are removed: /foo//bar -> /foo/bar * - dot components are removed: /foo/./bar -> /foo/bar * * @todo remove double dot components: /foo/baz/../bar -> /foo/bar * * @param path the path to normalize * @param sep the separator token (usually '/' on Unix-style systems, or '\\' on Windows based stuff) * @return the normalized path */ Common::String normalizePath(const Common::String &path, const char sep); /** * Simple DOS-style pattern matching function (understands * and ? like used in DOS). * Taken from exult/files/listfiles.cc * * Token meaning: * "*": any character, any amount of times. * "?": any character, only once. * * Example strings/patterns: * String: monkey.s01 Pattern: monkey.s?? => true * String: monkey.s101 Pattern: monkey.s?? => false * String: monkey.s99 Pattern: monkey.s?1 => false * String: monkey.s101 Pattern: monkey.s* => true * String: monkey.s99 Pattern: monkey.s*1 => false * * @param str Text to be matched against the given pattern. * @param pat Glob pattern. * @param ignoreCase Whether to ignore the case when doing pattern match * @param pathMode Whether to use path mode, i.e., whether slashes must be matched explicitly. * * @return true if str matches the pattern, false otherwise. */ bool matchString(const char *str, const char *pat, bool ignoreCase = false, bool pathMode = false); /** * Take a 32 bit value and turn it into a four character string, where each of * the four bytes is turned into one character. Most significant byte is printed * first. */ String tag2string(uint32 tag); /** * Copy up to size - 1 characters from src to dst and also zero terminate the * result. Note that src must be a zero terminated string. * * In case size is zero this function just returns the length of the source * string. * * @note This is modeled after OpenBSD's strlcpy. See the manpage here: * http://www.openbsd.org/cgi-bin/man.cgi?query=strlcpy * * @param dst The destination buffer. * @param src The source string. * @param size The size of the destination buffer. * @return The length of the (non-truncated) result, i.e. strlen(src). */ size_t strlcpy(char *dst, const char *src, size_t size); /** * Append the string src to the string dst. Note that both src and dst must be * zero terminated. The result will be zero terminated. At most * "size - strlen(dst) - 1" bytes will be appended. * * In case the dst string does not contain a zero within the first "size" bytes * the dst string will not be changed and size + strlen(src) is returned. * * @note This is modeled after OpenBSD's strlcat. See the manpage here: * http://www.openbsd.org/cgi-bin/man.cgi?query=strlcat * * @param dst The string the source string should be appended to. * @param src The source string. * @param size The (total) size of the destination buffer. * @return The length of the (non-truncated) result. That is * strlen(dst) + strlen(src). In case strlen(dst) > size * size + strlen(src) is returned. */ size_t strlcat(char *dst, const char *src, size_t size); /** * Convenience wrapper for tag2string which "returns" a C string. * Note: It is *NOT* safe to do anything with the return value other than directly * copying or printing it. */ #define tag2str(x) Common::tag2string(x).c_str() } // End of namespace Common #endif