summaryrefslogtreecommitdiff
path: root/oox/source/helper/textinputstream.cxx
blob: 8296144d73ec5b41854e7e5b3c89d30a321b17a3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*************************************************************************
 *
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * Copyright 2000, 2010 Oracle and/or its affiliates.
 *
 * OpenOffice.org - a multi-platform office productivity suite
 *
 * This file is part of OpenOffice.org.
 *
 * OpenOffice.org is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License version 3
 * only, as published by the Free Software Foundation.
 *
 * OpenOffice.org is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Lesser General Public License version 3 for more details
 * (a copy is included in the LICENSE file that accompanied this code).
 *
 * You should have received a copy of the GNU Lesser General Public License
 * version 3 along with OpenOffice.org.  If not, see
 * <http://www.openoffice.org/license.html>
 * for a copy of the LGPLv3 License.
 *
 ************************************************************************/

#include "oox/helper/textinputstream.hxx"

#include <rtl/strbuf.hxx>
#include <rtl/ustrbuf.hxx>
#include "oox/helper/binaryinputstream.hxx"

namespace oox {

// ============================================================================

using ::rtl::OStringBuffer;
using ::rtl::OStringToOUString;
using ::rtl::OUString;
using ::rtl::OUStringBuffer;

// ============================================================================

namespace {

/** Reads a text line from stream. First, tries to skip the second character of
    a two-character line end sequence. Returns the new line-end character. */
template< typename BufferType, typename CharType, typename StreamDataType >
sal_Unicode lclReadLine( BufferType& orBuffer, BinaryInputStream& rInStrm, sal_Unicode cLastEolChar )
{
    // try to skip LF following CR, or CR following LF
    if( !rInStrm.isEof() && (cLastEolChar != 0) )
    {
        CharType cChar = static_cast< CharType >( rInStrm.readValue< StreamDataType >() );
        // return on EOF after line-end
        if( rInStrm.isEof() )
            return 0;
        // return on sequence of equal line-end characters
        bool bIsEolChar = (cChar == 10) || (cChar == 13);
        if( bIsEolChar && (cChar == cLastEolChar) )
            return cChar;
        // append the character, if it is not the other line-end charcter
        if( !bIsEolChar )
            orBuffer.append( cChar );
    }

    // read chars until EOF or line end character (LF or CR)
    while( true )
    {
        CharType cChar = static_cast< CharType >( rInStrm.readValue< StreamDataType >() );
        if( rInStrm.isEof() )
            return 0;
        if( (cChar == 10) || (cChar == 13) )
            return cChar;
        orBuffer.append( cChar );
    }
}

} // namespace

// ============================================================================

TextInputStream::TextInputStream( BinaryInputStream& rInStrm, rtl_TextEncoding eTextEnc ) :
    mrInStrm( rInStrm ),
    meTextEnc( eTextEnc ),
    mcLastEolChar( 0 )
{
}

bool TextInputStream::isEof() const
{
    // do not return EOF, if last text line missed line-end character (see below)
    return mrInStrm.isEof() && (mcLastEolChar == 0);
}

OUString TextInputStream::readLine()
{
    if( mrInStrm.isEof() )
    {
        mcLastEolChar = 0;
        return OUString();
    }

    OUString aLine;
    if( meTextEnc == RTL_TEXTENCODING_UCS2 )
    {
        // read 16-bit characters for UCS2 encoding
        OUStringBuffer aBuffer;
        mcLastEolChar = lclReadLine< OUStringBuffer, sal_Unicode, sal_uInt16 >( aBuffer, mrInStrm, mcLastEolChar );
        aLine = aBuffer.makeStringAndClear();
    }
    else
    {
        // otherwise, read 8-bit characters and convert according to text encoding
        OStringBuffer aBuffer;
        mcLastEolChar = lclReadLine< OStringBuffer, sal_Char, sal_uInt8 >( aBuffer, mrInStrm, mcLastEolChar );
        aLine = OStringToOUString( aBuffer.makeStringAndClear(), meTextEnc );
    }

    // if last line is not empty but line-end character is missing, do not return EOF
    if( mrInStrm.isEof() && (aLine.getLength() > 0) )
        mcLastEolChar = 10;

    return aLine;
}

// ============================================================================

} // namespace oox

/* vim:set shiftwidth=4 softtabstop=4 expandtab: */