office-gobmx/l10ntools/source/lngmerge.cxx
Xisco Fauli f558eb09dc tdf#163486: PVS: check stream read instead of EOF
V1024 	The 'aStream' stream is checked for EOF before reading from it, but is not checked after reading. Potential use of invalid data.

Change-Id: I4f7b10bc896d13a31a97ed0dbacd413de990eb89
Reviewed-on: https://gerrit.libreoffice.org/c/core/+/175363
Tested-by: Jenkins
Reviewed-by: Xisco Fauli <xiscofauli@libreoffice.org>
Reviewed-by: Mike Kaganski <mike.kaganski@collabora.com>
2024-10-22 12:43:28 +02:00

278 lines
8.4 KiB
C++

/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*
* This file is part of the LibreOffice project.
*
* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
*
* This file incorporates work covered by the following license notice:
*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed
* with this work for additional information regarding copyright
* ownership. The ASF licenses this file to you under the Apache
* License, Version 2.0 (the "License"); you may not use this file
* except in compliance with the License. You may obtain a copy of
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
*/
#include <sal/config.h>
#include <o3tl/string_view.hxx>
#include <cstddef>
#include <iostream>
#include <memory>
#include <string>
#include <common.hxx>
#include <po.hxx>
#include <lngmerge.hxx>
#include <utility>
namespace {
bool lcl_isNextGroup(OString &sGroup_out, std::string_view sLineTrim)
{
if (o3tl::starts_with(sLineTrim, "[") && o3tl::ends_with(sLineTrim, "]"))
{
sLineTrim = o3tl::getToken(sLineTrim, 1, '[');
sLineTrim = o3tl::getToken(sLineTrim, 0, ']');
sGroup_out = OString(o3tl::trim(sLineTrim));
return true;
}
return false;
}
void lcl_RemoveUTF8ByteOrderMarker( OString &rString )
{
if( rString.getLength() >= 3 && rString[0] == '\xEF' &&
rString[1] == '\xBB' && rString[2] == '\xBF' )
{
rString = rString.copy(3);
}
}
}
LngParser::LngParser(OString sLngFile)
: sSource(std::move( sLngFile ))
{
std::ifstream aStream(sSource.getStr());
if (!aStream.is_open())
return;
bool bFirstLine = true;
std::string s;
while (std::getline(aStream, s))
{
OString sLine(s.data(), s.length());
if( bFirstLine )
{
// Always remove UTF8 BOM from the first line
lcl_RemoveUTF8ByteOrderMarker( sLine );
bFirstLine = false;
}
mvLines.push_back( sLine );
}
mvLines.push_back( OString() );
}
LngParser::~LngParser()
{
}
void LngParser::CreatePO( const OString &rPOFile )
{
PoOfstream aPOStream( rPOFile, PoOfstream::APP );
if (!aPOStream.isOpen()) {
std::cerr << "Ulfex error: Can't open po file:" << rPOFile << "\n";
}
size_t nPos = 0;
bool bStart = true;
OString sGroup, sLine;
OStringHashMap Text;
OString sID;
while( nPos < mvLines.size() ) {
sLine = mvLines[ nPos++ ];
while( nPos < mvLines.size() && !isNextGroup( sGroup , sLine ) ) {
ReadLine( sLine , Text );
sID = sGroup;
sLine = mvLines[ nPos++ ];
}
if( bStart ) {
bStart = false;
sID = sGroup;
}
else {
WritePO( aPOStream , Text , sSource , sID );
}
Text.erase("x-comment"_ostr);
}
aPOStream.close();
}
void LngParser::WritePO(PoOfstream &aPOStream,
OStringHashMap &rText_inout, const OString &rActFileName,
const OString &rID)
{
common::writePoEntry(
"Ulfex"_ostr, aPOStream, rActFileName, "LngText",
rID, OString(), rText_inout.count("x-comment"_ostr) ? rText_inout["x-comment"_ostr] : OString(), rText_inout["en-US"_ostr]);
}
bool LngParser::isNextGroup(OString &sGroup_out, std::string_view sLine_in)
{
return lcl_isNextGroup(sGroup_out, o3tl::trim(sLine_in));
}
void LngParser::ReadLine(std::string_view rLine_in,
OStringHashMap &rText_inout)
{
if (!o3tl::starts_with(rLine_in, " *") && !o3tl::starts_with(rLine_in, "/*"))
{
OString sLang(o3tl::trim(o3tl::getToken(rLine_in, 0, '=')));
if (!sLang.isEmpty()) {
rText_inout[sLang] = OString(o3tl::getToken(rLine_in, 1, '"'));
}
}
}
void LngParser::Merge(
const OString &rPOFile,
const OString &rDestinationFile,
std::string_view rLanguage )
{
std::ofstream aDestination(
rDestinationFile.getStr(), std::ios_base::out | std::ios_base::trunc);
MergeDataFile aMergeDataFile( rPOFile, sSource, false, true );
if( o3tl::equalsIgnoreAsciiCase(rLanguage, "ALL") )
aLanguages = aMergeDataFile.GetLanguages();
size_t nPos = 0;
bool bGroup = false;
OString sGroup;
// seek to next group
while ( nPos < mvLines.size() && !bGroup )
bGroup = lcl_isNextGroup(sGroup, o3tl::trim(mvLines[nPos++]));
while ( nPos < mvLines.size()) {
OStringHashMap Text;
OString sID( sGroup );
std::size_t nLastLangPos = 0;
ResData aResData( sID, sSource );
aResData.sResTyp = "LngText"_ostr;
MergeEntrys *pEntrys = aMergeDataFile.GetMergeEntrys( &aResData );
// read languages
bGroup = false;
OString sLanguagesDone;
while ( nPos < mvLines.size() && !bGroup )
{
const OString sLine{ mvLines[nPos].trim() };
if ( lcl_isNextGroup(sGroup, sLine) )
{
bGroup = true;
nPos ++;
sLanguagesDone = ""_ostr;
}
else
{
sal_Int32 n = 0;
OString sLang(sLine.getToken(0, '=', n));
if (n == -1 || static_cast<bool>(sLine.match("/*")))
{
++nPos;
}
else
{
sLang = sLang.trim();
OString sSearch{ ";" + sLang + ";" };
if ( sLanguagesDone.indexOf( sSearch ) != -1 ) {
mvLines.erase( mvLines.begin() + nPos );
}
if( pEntrys )
{
if( !sLang.isEmpty() )
{
OString sNewText;
pEntrys->GetText( sNewText, sLang, true );
if( sLang == "qtz" )
continue;
if ( !sNewText.isEmpty()) {
mvLines[ nPos ] = sLang
+ " = \""
// escape quotes, unescape double escaped quotes fdo#56648
+ sNewText.replaceAll("\""_ostr,"\\\""_ostr).replaceAll("\\\\\""_ostr,"\\\""_ostr)
+ "\"";
Text[ sLang ] = sNewText;
}
}
nLastLangPos = nPos;
nPos ++;
sLanguagesDone += sSearch;
}
else {
nLastLangPos = nPos;
nPos ++;
sLanguagesDone += sSearch;
}
}
}
}
OString sCur;
if ( nLastLangPos )
{
for(size_t n = 0; n < aLanguages.size(); ++n)
{
sCur = aLanguages[ n ];
if( !sCur.equalsIgnoreAsciiCase("en-US") && Text[sCur].isEmpty() && pEntrys )
{
OString sNewText;
pEntrys->GetText( sNewText, sCur, true );
if( sCur == "qtz" )
continue;
if ( !sNewText.isEmpty() && sCur != "x-comment")
{
const OString sLine { sCur
+ " = \""
// escape quotes, unescape double escaped quotes fdo#56648
+ sNewText.replaceAll("\""_ostr,"\\\""_ostr).replaceAll("\\\\\""_ostr,"\\\""_ostr)
+ "\"" };
nLastLangPos++;
nPos++;
if ( nLastLangPos < mvLines.size() ) {
mvLines.insert( mvLines.begin() + nLastLangPos, sLine );
} else {
mvLines.push_back( sLine );
}
}
}
}
}
}
for ( size_t i = 0; i < mvLines.size(); ++i )
aDestination << mvLines[i] << '\n';
aDestination.close();
}
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */