aboutsummaryrefslogtreecommitdiff
path: root/src/unstable/text.h
blob: 1d623ff3845a2958b98554f92327d2dffcc5e76d (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
/*
 * Copyright (C) 2007-2019 Xagasoft, All rights reserved.
 *
 * This file is part of the libbu++ library and is released under the
 * terms of the license contained in the file LICENSE.
 */

#ifndef BU_TEXT_H
#define BU_TEXT_H

#include "bu/config.h"

namespace Bu
{
    /**
     * Represents a string of text. Human readable language. This should be
     * used any time you're dealing with actual text and not just binary
     * data. If you neeed to transport raw binary data then consider using
     * Blob and BlobBuilder.
     *
     * Text objects should be considered immutable.  If you need to construct
     * a Text object dynamically take a look at TextBuilder, and for
     * serialization take a look at TextStream.
     *
     * A Text object is a sequence of Unicode code points. A code point is not
     * one to one with a character. A single character can be represented with
     * multilpe code points. In addition, a code point can also represent
     * formatting or display inforamtion.
     *
     * Internally all data is stored in UTF-16, which is a fair compromise for
     * mose text.  All characters from all modern natural languages fit within
     * the Basic Multilingual Plane, which requires only a single 16 bit value
     * to represent it.  However, when iterating through or addressing data
     * in the Text object all work is done on a code point basis.
     */
    class Text
    {
    public:
        class iterator;
        class const_iterator;
        typedef uint32_t CodePoint;

    public:
        Text();
        Text( const Text &rSrc );
        virtual ~Text();

        bool isEmpty() const;
        bool isBmpOnly() const;
        int32_t getSize() const;
        int32_t getSizeInBytes() const;

        uint16_t *getRawData() const;
//        Text transform( (CodePoint *)(*pCallback)( CodePoint * ) );

    private:
        uint16_t *pData;
        int32_t iSize;
        int32_t iCodePoints;
    };
    typedef Text::CodePoint CodePoint;
}

#endif