VirtualBox

source: vbox/trunk/include/VBox/com/string.h@ 21369

Last change on this file since 21369 was 21369, checked in by vboxsync, 16 years ago

IPRT: hide ministring::operator bool() to force people to use isEmpty() explicitly, second try

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 20.7 KB
Line 
1/* $Id: string.h 21369 2009-07-07 18:52:12Z vboxsync $ */
2
3/** @file
4 * MS COM / XPCOM Abstraction Layer:
5 * Smart string classes declaration
6 */
7
8/*
9 * Copyright (C) 2006-2009 Sun Microsystems, Inc.
10 *
11 * This file is part of VirtualBox Open Source Edition (OSE), as
12 * available from http://www.215389.xyz. This file is free software;
13 * you can redistribute it and/or modify it under the terms of the GNU
14 * General Public License (GPL) as published by the Free Software
15 * Foundation, in version 2 as it comes in the "COPYING" file of the
16 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
17 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
18 *
19 * The contents of this file may alternatively be used under the terms
20 * of the Common Development and Distribution License Version 1.0
21 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
22 * VirtualBox OSE distribution, in which case the provisions of the
23 * CDDL are applicable instead of those of the GPL.
24 *
25 * You may elect to license modified versions of this file under the
26 * terms and conditions of either the GPL or the CDDL or both.
27 *
28 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa
29 * Clara, CA 95054 USA or visit http://www.sun.com if you need
30 * additional information or have any questions.
31 */
32
33#ifndef ___VBox_com_string_h
34#define ___VBox_com_string_h
35
36/* Make sure all the stdint.h macros are included - must come first! */
37#ifndef __STDC_LIMIT_MACROS
38# define __STDC_LIMIT_MACROS
39#endif
40#ifndef __STDC_CONSTANT_MACROS
41# define __STDC_CONSTANT_MACROS
42#endif
43
44#if defined (VBOX_WITH_XPCOM)
45# include <nsMemory.h>
46#endif
47
48#include "VBox/com/defs.h"
49#include "VBox/com/assert.h"
50
51#include <iprt/cpputils.h>
52#include <iprt/alloc.h>
53#include <iprt/ministring_cpp.h>
54
55namespace com
56{
57
58class Utf8Str;
59
60/**
61 * Helper class that represents the |BSTR| type and hides platform-specific
62 * implementation details.
63 *
64 * This class uses COM/XPCOM-provided memory management routines to allocate
65 * and free string buffers. This makes it possible to:
66 * - use it as a type of member variables of COM/XPCOM components and pass
67 * their values to callers through component methods' output parameters
68 * using the #cloneTo() operation;
69 * - adopt (take ownership of) string buffers returned in output parameters
70 * of COM methods using the #asOutParam() operation and correctly free them
71 * afterwards.
72 */
73class Bstr
74{
75public:
76
77 typedef BSTR String;
78 typedef CBSTR ConstString;
79
80 Bstr () : bstr (NULL) {}
81
82 Bstr (const Bstr &that) : bstr (NULL) { raw_copy (bstr, that.bstr); }
83 Bstr (CBSTR that) : bstr (NULL) { raw_copy (bstr, that); }
84
85#if defined (VBOX_WITH_XPCOM)
86 Bstr (const wchar_t *that) : bstr (NULL)
87 {
88 AssertCompile (sizeof (wchar_t) == sizeof (OLECHAR));
89 raw_copy (bstr, (CBSTR) that);
90 }
91#endif
92
93 Bstr (const Utf8Str &that);
94 Bstr (const char *that);
95
96 /** Shortcut that calls #alloc(aSize) right after object creation. */
97 Bstr (size_t aSize) : bstr (NULL) { alloc (aSize); }
98
99 ~Bstr () { setNull(); }
100
101 Bstr &operator = (const Bstr &that) { safe_assign (that.bstr); return *this; }
102 Bstr &operator = (CBSTR that) { safe_assign (that); return *this; }
103
104 Bstr &operator = (const Utf8Str &that);
105 Bstr &operator = (const char *that);
106
107 Bstr &setNull()
108 {
109 if (bstr)
110 {
111 ::SysFreeString (bstr);
112 bstr = NULL;
113 }
114 return *this;
115 }
116
117 Bstr &setNullIfEmpty()
118 {
119 if (bstr && *bstr == 0)
120 {
121 ::SysFreeString (bstr);
122 bstr = NULL;
123 }
124 return *this;
125 }
126
127 /**
128 * Allocates memory for a string capable to store \a aSize - 1 characters;
129 * in other words, aSize includes the terminating zero character. If \a aSize
130 * is zero, or if a memory allocation error occurs, this object will become null.
131 */
132 Bstr &alloc (size_t aSize)
133 {
134 setNull();
135 if (aSize)
136 {
137 unsigned int size = (unsigned int) aSize; Assert (size == aSize);
138 bstr = ::SysAllocStringLen (NULL, size - 1);
139 if (bstr)
140 bstr [0] = 0;
141 }
142 return *this;
143 }
144
145 int compare (CBSTR str) const
146 {
147 return ::RTUtf16Cmp ((PRTUTF16) bstr, (PRTUTF16) str);
148 }
149
150 int compare (BSTR str) const
151 {
152 return ::RTUtf16Cmp ((PRTUTF16) bstr, (PRTUTF16) str);
153 }
154
155 bool operator==(const Bstr &that) const { return !compare (that.bstr); }
156 bool operator!=(const Bstr &that) const { return !!compare (that.bstr); }
157 bool operator==(CBSTR that) const { return !compare (that); }
158 bool operator==(BSTR that) const { return !compare (that); }
159
160#if defined (VBOX_WITH_XPCOM)
161 bool operator!=(const wchar_t *that) const
162 {
163 AssertCompile (sizeof (wchar_t) == sizeof (OLECHAR));
164 return !!compare ((CBSTR) that);
165 }
166 bool operator==(const wchar_t *that) const
167 {
168 AssertCompile (sizeof (wchar_t) == sizeof (OLECHAR));
169 return !compare ((CBSTR) that);
170 }
171#endif
172
173 bool operator!=(CBSTR that) const { return !!compare (that); }
174 bool operator!=(BSTR that) const { return !!compare (that); }
175 bool operator<(const Bstr &that) const { return compare (that.bstr) < 0; }
176 bool operator<(CBSTR that) const { return compare (that) < 0; }
177 bool operator<(BSTR that) const { return compare (that) < 0; }
178#if defined (VBOX_WITH_XPCOM)
179 bool operator<(const wchar_t *that) const
180 {
181 AssertCompile (sizeof (wchar_t) == sizeof (OLECHAR));
182 return compare ((CBSTR) that) < 0;
183 }
184#endif
185
186 int compareIgnoreCase (CBSTR str) const
187 {
188 return ::RTUtf16LocaleICmp (bstr, str);
189 }
190
191 bool isNull() const { return bstr == NULL; }
192 operator bool() const { return !isNull(); }
193
194 bool isEmpty() const { return isNull() || *bstr == 0; }
195
196 size_t length() const { return isNull() ? 0 : ::RTUtf16Len ((PRTUTF16) bstr); }
197
198 /** Intended to to pass instances as |CBSTR| input parameters to methods. */
199 operator CBSTR () const { return bstr; }
200
201 /**
202 * Intended to to pass instances as |BSTR| input parameters to methods.
203 * Note that we have to provide this mutable BSTR operator since in MS COM
204 * input BSTR parameters of interface methods are not const.
205 */
206 operator BSTR () { return bstr; }
207
208 /**
209 * The same as operator CBSTR(), but for situations where the compiler
210 * cannot typecast implicitly (for example, in printf() argument list).
211 */
212 CBSTR raw() const { return bstr; }
213
214 /**
215 * Returns a non-const raw pointer that allows to modify the string directly.
216 * @warning
217 * Be sure not to modify data beyond the allocated memory! The
218 * guaranteed size of the allocated memory is at least #length()
219 * bytes after creation and after every assignment operation.
220 */
221 BSTR mutableRaw() { return bstr; }
222
223 /**
224 * Intended to assign copies of instances to |BSTR| out parameters from
225 * within the interface method. Transfers the ownership of the duplicated
226 * string to the caller.
227 */
228 const Bstr &cloneTo (BSTR *pstr) const
229 {
230 if (pstr)
231 {
232 *pstr = NULL;
233 raw_copy (*pstr, bstr);
234 }
235 return *this;
236 }
237
238 /**
239 * Intended to assign instances to |BSTR| out parameters from within the
240 * interface method. Transfers the ownership of the original string to the
241 * caller and resets the instance to null.
242 *
243 * As opposed to cloneTo(), this method doesn't create a copy of the
244 * string.
245 */
246 Bstr &detachTo (BSTR *pstr)
247 {
248 *pstr = bstr;
249 bstr = NULL;
250 return *this;
251 }
252
253 /**
254 * Intended to assign copies of instances to |char *| out parameters from
255 * within the interface method. Transfers the ownership of the duplicated
256 * string to the caller.
257 */
258 const Bstr &cloneTo (char **pstr) const;
259
260 /**
261 * Intended to pass instances as |BSTR| out parameters to methods.
262 * Takes the ownership of the returned data.
263 */
264 BSTR *asOutParam() { setNull(); return &bstr; }
265
266 /**
267 * Static immutable null object. May be used for comparison purposes.
268 */
269 static const Bstr Null;
270
271protected:
272
273 void safe_assign (CBSTR str)
274 {
275 if (bstr != str)
276 {
277 setNull();
278 raw_copy (bstr, str);
279 }
280 }
281
282 inline static void raw_copy (BSTR &ls, CBSTR rs)
283 {
284 if (rs)
285 ls = ::SysAllocString ((const OLECHAR *) rs);
286 }
287
288 inline static void raw_copy (BSTR &ls, const char *rs)
289 {
290 if (rs)
291 {
292 PRTUTF16 s = NULL;
293 ::RTStrToUtf16 (rs, &s);
294 raw_copy (ls, (BSTR) s);
295 ::RTUtf16Free (s);
296 }
297 }
298
299 BSTR bstr;
300
301 friend class Utf8Str; /* to access our raw_copy() */
302};
303
304/* symmetric compare operators */
305inline bool operator==(CBSTR l, const Bstr &r) { return r.operator== (l); }
306inline bool operator!=(CBSTR l, const Bstr &r) { return r.operator!= (l); }
307inline bool operator==(BSTR l, const Bstr &r) { return r.operator== (l); }
308inline bool operator!=(BSTR l, const Bstr &r) { return r.operator!= (l); }
309
310////////////////////////////////////////////////////////////////////////////////
311
312/**
313 * Helper class that represents UTF8 (|char *|) strings. Useful in
314 * conjunction with Bstr to simplify conversions between UTF16 (|BSTR|)
315 * and UTF8.
316 *
317 * This class uses COM/XPCOM-provided memory management routines to allocate
318 * and free string buffers. This makes it possible to:
319 * - use it as a type of member variables of COM/XPCOM components and pass
320 * their values to callers through component methods' output parameters
321 * using the #cloneTo() operation;
322 * - adopt (take ownership of) string buffers returned in output parameters
323 * of COM methods using the #asOutParam() operation and correctly free them
324 * afterwards.
325 */
326class Utf8Str : public ministring
327{
328public:
329
330 Utf8Str() {}
331
332 Utf8Str(const Utf8Str &that)
333 : ministring(that)
334 {}
335
336 Utf8Str(const char *that)
337 : ministring(that)
338 {}
339
340 Utf8Str(const Bstr &that)
341 {
342 copyFrom(that);
343 }
344
345 Utf8Str(CBSTR that)
346 {
347 copyFrom(that);
348 }
349
350 Utf8Str& operator=(const Utf8Str &that)
351 {
352 ministring::operator=(that);
353 return *this;
354 }
355
356 Utf8Str& operator=(const char *that)
357 {
358 ministring::operator=(that);
359 return *this;
360 }
361
362 Utf8Str& operator=(const Bstr &that)
363 {
364 cleanup();
365 copyFrom(that);
366 return *this;
367 }
368
369 Utf8Str& operator=(CBSTR that)
370 {
371 cleanup();
372 copyFrom(that);
373 return *this;
374 }
375
376 /**
377 * Intended to assign instances to |char *| out parameters from within the
378 * interface method. Transfers the ownership of the duplicated string to the
379 * caller.
380 */
381 const Utf8Str& cloneTo(char **pstr) const
382 {
383 if (pstr)
384 *pstr = RTStrDup(m_psz);
385 return *this;
386 }
387
388 /**
389 * Intended to assign instances to |char *| out parameters from within the
390 * interface method. Transfers the ownership of the original string to the
391 * caller and resets the instance to null.
392 *
393 * As opposed to cloneTo(), this method doesn't create a copy of the
394 * string.
395 */
396 Utf8Str& detachTo(char **pstr)
397 {
398 *pstr = m_psz;
399 m_psz = NULL;
400 m_cbAllocated = 0;
401 m_cbLength = 0;
402 return *this;
403 }
404
405 /**
406 * Intended to assign instances to |BSTR| out parameters from within the
407 * interface method. Transfers the ownership of the duplicated string to the
408 * caller.
409 */
410 const Utf8Str& cloneTo(BSTR *pstr) const
411 {
412 if (pstr)
413 {
414 *pstr = NULL;
415 Bstr::raw_copy(*pstr, m_psz);
416 }
417 return *this;
418 }
419
420 static const size_t npos;
421
422 /**
423 * Looks for pcszFind in "this" starting at "pos" and returns its position,
424 * counting from the beginning of "this" at 0. Returns npos if not found.
425 */
426 size_t find(const char *pcszFind, size_t pos = 0) const;
427
428 /**
429 * Returns a substring of "this" as a new Utf8Str. Works exactly like
430 * its equivalent in std::string except that this interprets pos and n
431 * as UTF-8 codepoints instead of bytes. With the default parameters "0"
432 * and "npos", this always copies the entire string.
433 * @param pos Index of first codepoint to copy from "this", counting from 0.
434 * @param n Number of codepoints to copy, starting with the one at "pos".
435 */
436 Utf8Str substr(size_t pos = 0, size_t n = npos) const;
437
438 /**
439 * Returns true if "this" ends with "that".
440 * @param that
441 * @param cs
442 * @return
443 */
444 bool endsWith(const Utf8Str &that, CaseSensitivity cs = CaseSensitive) const;
445
446 /**
447 * Returns true if "this" begins with "that".
448 * @return
449 */
450 bool startsWith(const Utf8Str &that, CaseSensitivity cs = CaseSensitive) const;
451
452 /**
453 * Returns true if "this" contains "that" (strstr).
454 * @param that
455 * @param cs
456 * @return
457 */
458 bool contains(const Utf8Str &that, CaseSensitivity cs = CaseSensitive) const;
459
460 /**
461 * Converts "this" to lower case by calling RTStrToLower().
462 * @return
463 */
464 Utf8Str& toLower();
465
466 /**
467 * Converts "this" to upper case by calling RTStrToUpper().
468 * @return
469 */
470 Utf8Str& toUpper();
471
472 /**
473 * Removes a trailing slash from the member string, if present.
474 * Calls RTPathStripTrailingSlash() without having to mess with mutableRaw().
475 */
476 void stripTrailingSlash();
477
478 /**
479 * Removes a trailing filename from the member string, if present.
480 * Calls RTPathStripFilename() without having to mess with mutableRaw().
481 */
482 void stripFilename();
483
484 /**
485 * Removes a trailing file name extension from the member string, if present.
486 * Calls RTPathStripExt() without having to mess with mutableRaw().
487 */
488 void stripExt();
489
490 /**
491 * Attempts to convert the member string into a 32-bit integer.
492 *
493 * @returns 32-bit unsigned number on success.
494 * @returns 0 on failure.
495 */
496 int toInt32() const
497 {
498 return RTStrToInt32(m_psz);
499 }
500
501 /**
502 * Attempts to convert the member string into an unsigned 32-bit integer.
503 *
504 * @returns 32-bit unsigned number on success.
505 * @returns 0 on failure.
506 */
507 int toUInt32() const
508 {
509 return RTStrToUInt32(m_psz);
510 }
511
512 /**
513 * Attempts to convert the member string into an 64-bit integer.
514 *
515 * @returns 64-bit unsigned number on success.
516 * @returns 0 on failure.
517 */
518 int64_t toInt64() const
519 {
520 return RTStrToInt64(m_psz);
521 }
522
523 /**
524 * Attempts to convert the member string into an unsigned 64-bit integer.
525 *
526 * @returns 64-bit unsigned number on success.
527 * @returns 0 on failure.
528 */
529 uint64_t toUInt64() const
530 {
531 return RTStrToUInt64(m_psz);
532 }
533
534 /**
535 * Attempts to convert the member string into an unsigned 64-bit integer.
536 * @return IPRT error code.
537 * @param i Output buffer.
538 */
539 int toInt(uint64_t &i) const;
540
541 /**
542 * Attempts to convert the member string into an unsigned 32-bit integer.
543 * @return IPRT error code.
544 * @param i Output buffer.
545 */
546 int toInt(uint32_t &i) const;
547
548 /**
549 * Intended to pass instances as out (|char **|) parameters to methods.
550 * Takes the ownership of the returned data.
551 */
552 char **asOutParam()
553 {
554 cleanup();
555 return &m_psz;
556 }
557
558 /**
559 * Static immutable null object. May be used for comparison purposes.
560 */
561 static const Utf8Str Null;
562
563protected:
564
565 /**
566 * As with the ministring::copyFrom() variants, this unconditionally
567 * sets the members to a copy of the given other strings and makes
568 * no assumptions about previous contents. This can therefore be used
569 * both in copy constructors, when member variables have no defined
570 * value, and in assignments after having called cleanup().
571 *
572 * This variant converts from a UTF-16 string, most probably from
573 * a Bstr assignment.
574 *
575 * @param rs
576 */
577 void copyFrom(CBSTR s)
578 {
579 if (s)
580 {
581 RTUtf16ToUtf8((PRTUTF16)s, &m_psz);
582 m_cbLength = strlen(m_psz); // TODO optimize by using a different RTUtf* function
583 m_cbAllocated = m_cbLength + 1;
584 }
585 else
586 {
587 m_cbLength = 0;
588 m_cbAllocated = 0;
589 m_psz = NULL;
590 }
591 }
592
593 friend class Bstr; /* to access our raw_copy() */
594};
595
596// work around error C2593 of the stupid MSVC 7.x ambiguity resolver
597WORKAROUND_MSVC7_ERROR_C2593_FOR_BOOL_OP (Bstr)
598
599////////////////////////////////////////////////////////////////////////////////
600
601// inlined Bstr members that depend on Utf8Str
602
603inline Bstr::Bstr (const Utf8Str &that) : bstr (NULL) { raw_copy (bstr, that); }
604inline Bstr::Bstr (const char *that) : bstr (NULL) { raw_copy (bstr, that); }
605
606inline Bstr &Bstr::operator = (const Utf8Str &that)
607{
608 setNull();
609 raw_copy (bstr, that);
610 return *this;
611}
612inline Bstr &Bstr::operator = (const char *that)
613{
614 setNull();
615 raw_copy (bstr, that);
616 return *this;
617}
618
619inline const Bstr& Bstr::cloneTo(char **pstr) const
620{
621 if (pstr)
622 {
623 Utf8Str ustr(*this);
624 ustr.detachTo(pstr);
625 }
626 return *this;
627}
628
629////////////////////////////////////////////////////////////////////////////////
630
631/**
632 * This class is a printf-like formatter for Utf8Str strings. Its purpose is
633 * to construct Utf8Str objects from a format string and a list of arguments
634 * for the format string.
635 *
636 * The usage of this class is like the following:
637 * <code>
638 * Utf8StrFmt string ("program name = %s", argv[0]);
639 * </code>
640 */
641class Utf8StrFmt : public Utf8Str
642{
643public:
644
645 /**
646 * Constructs a new string given the format string and the list
647 * of the arguments for the format string.
648 *
649 * @param format printf-like format string (in UTF-8 encoding)
650 * @param ... list of the arguments for the format string
651 */
652 explicit Utf8StrFmt (const char *format, ...)
653 {
654 va_list args;
655 va_start (args, format);
656 init (format, args);
657 va_end (args);
658 }
659
660protected:
661
662 Utf8StrFmt() {}
663
664 void init (const char *format, va_list args);
665
666private:
667
668 static DECLCALLBACK(size_t) strOutput (void *pvArg, const char *pachChars,
669 size_t cbChars);
670};
671
672/**
673 * This class is a vprintf-like formatter for Utf8Str strings. It is
674 * identical to Utf8StrFmt except that its constructor takes a va_list
675 * argument instead of ellipsis.
676 *
677 * Note that a separate class is necessary because va_list is defined as
678 * |char *| on most platforms. For this reason, if we had two overloaded
679 * constructors in Utf8StrFmt (one taking ellipsis and another one taking
680 * va_list) then composing a constructor call using exactly two |char *|
681 * arguments would cause the compiler to use the va_list overload instead of
682 * the ellipsis one which is obviously wrong. The compiler would choose
683 * va_list because ellipsis has the lowest rank when it comes to resolving
684 * overloads, as opposed to va_list which is an exact match for |char *|.
685 */
686class Utf8StrFmtVA : public Utf8StrFmt
687{
688public:
689
690 /**
691 * Constructs a new string given the format string and the list
692 * of the arguments for the format string.
693 *
694 * @param format printf-like format string (in UTF-8 encoding)
695 * @param args list of arguments for the format string
696 */
697 Utf8StrFmtVA (const char *format, va_list args) { init (format, args); }
698};
699
700/**
701 * The BstrFmt class is a shortcut to <tt>Bstr (Utf8StrFmt (...))</tt>.
702 */
703class BstrFmt : public Bstr
704{
705public:
706
707 /**
708 * Constructs a new string given the format string and the list of the
709 * arguments for the format string.
710 *
711 * @param aFormat printf-like format string (in UTF-8 encoding).
712 * @param ... List of the arguments for the format string.
713 */
714 explicit BstrFmt (const char *aFormat, ...)
715 {
716 va_list args;
717 va_start (args, aFormat);
718 raw_copy (bstr, Utf8StrFmtVA (aFormat, args));
719 va_end (args);
720 }
721};
722
723/**
724 * The BstrFmtVA class is a shortcut to <tt>Bstr (Utf8StrFmtVA (...))</tt>.
725 */
726class BstrFmtVA : public Bstr
727{
728public:
729
730 /**
731 * Constructs a new string given the format string and the list of the
732 * arguments for the format string.
733 *
734 * @param aFormat printf-like format string (in UTF-8 encoding).
735 * @param aArgs List of arguments for the format string
736 */
737 BstrFmtVA (const char *aFormat, va_list aArgs)
738 {
739 raw_copy (bstr, Utf8StrFmtVA (aFormat, aArgs));
740 }
741};
742
743} /* namespace com */
744
745#endif /* ___VBox_com_string_h */
Note: See TracBrowser for help on using the repository browser.

© 2025 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette