f558eb09dc
V1024 The 'aStream' stream is checked for EOF before reading from it, but is not checked after reading. Potential use of invalid data. Change-Id: I4f7b10bc896d13a31a97ed0dbacd413de990eb89 Reviewed-on: https://gerrit.libreoffice.org/c/core/+/175363 Tested-by: Jenkins Reviewed-by: Xisco Fauli <xiscofauli@libreoffice.org> Reviewed-by: Mike Kaganski <mike.kaganski@collabora.com>
278 lines
8.4 KiB
C++
278 lines
8.4 KiB
C++
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
|
/*
|
|
* This file is part of the LibreOffice project.
|
|
*
|
|
* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
*
|
|
* This file incorporates work covered by the following license notice:
|
|
*
|
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
|
* contributor license agreements. See the NOTICE file distributed
|
|
* with this work for additional information regarding copyright
|
|
* ownership. The ASF licenses this file to you under the Apache
|
|
* License, Version 2.0 (the "License"); you may not use this file
|
|
* except in compliance with the License. You may obtain a copy of
|
|
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
|
|
*/
|
|
|
|
#include <sal/config.h>
|
|
|
|
#include <o3tl/string_view.hxx>
|
|
|
|
#include <cstddef>
|
|
#include <iostream>
|
|
#include <memory>
|
|
#include <string>
|
|
|
|
#include <common.hxx>
|
|
#include <po.hxx>
|
|
#include <lngmerge.hxx>
|
|
#include <utility>
|
|
|
|
namespace {
|
|
|
|
bool lcl_isNextGroup(OString &sGroup_out, std::string_view sLineTrim)
|
|
{
|
|
if (o3tl::starts_with(sLineTrim, "[") && o3tl::ends_with(sLineTrim, "]"))
|
|
{
|
|
sLineTrim = o3tl::getToken(sLineTrim, 1, '[');
|
|
sLineTrim = o3tl::getToken(sLineTrim, 0, ']');
|
|
sGroup_out = OString(o3tl::trim(sLineTrim));
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
void lcl_RemoveUTF8ByteOrderMarker( OString &rString )
|
|
{
|
|
if( rString.getLength() >= 3 && rString[0] == '\xEF' &&
|
|
rString[1] == '\xBB' && rString[2] == '\xBF' )
|
|
{
|
|
rString = rString.copy(3);
|
|
}
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
 * Loads the given source file into mvLines, one entry per line.
 *
 * A UTF-8 byte order mark at the start of the first line is removed. After
 * the last line read, one extra empty line is appended. If the file cannot
 * be opened, mvLines is left without any entries.
 *
 * @param sLngFile  path of the file to read; also stored as sSource
 */
LngParser::LngParser(OString sLngFile)
    : sSource(std::move( sLngFile ))
{
    std::ifstream aInput(sSource.getStr());
    if (aInput.is_open())
    {
        std::string aRaw;
        // bAtTop is true only while the very first line is being handled.
        for (bool bAtTop = true; std::getline(aInput, aRaw); bAtTop = false)
        {
            OString aLine(aRaw.data(), aRaw.length());
            if( bAtTop )
                lcl_RemoveUTF8ByteOrderMarker( aLine );
            mvLines.push_back( aLine );
        }
        // Trailing empty line that terminates the stored content.
        mvLines.push_back( OString() );
    }
}
|
|
|
|
/// Nothing to release explicitly; members clean up after themselves.
LngParser::~LngParser() = default;
|
|
|
|
void LngParser::CreatePO( const OString &rPOFile )
|
|
{
|
|
PoOfstream aPOStream( rPOFile, PoOfstream::APP );
|
|
if (!aPOStream.isOpen()) {
|
|
std::cerr << "Ulfex error: Can't open po file:" << rPOFile << "\n";
|
|
}
|
|
|
|
size_t nPos = 0;
|
|
bool bStart = true;
|
|
OString sGroup, sLine;
|
|
OStringHashMap Text;
|
|
OString sID;
|
|
|
|
while( nPos < mvLines.size() ) {
|
|
sLine = mvLines[ nPos++ ];
|
|
while( nPos < mvLines.size() && !isNextGroup( sGroup , sLine ) ) {
|
|
ReadLine( sLine , Text );
|
|
sID = sGroup;
|
|
sLine = mvLines[ nPos++ ];
|
|
}
|
|
if( bStart ) {
|
|
bStart = false;
|
|
sID = sGroup;
|
|
}
|
|
else {
|
|
WritePO( aPOStream , Text , sSource , sID );
|
|
}
|
|
Text.erase("x-comment"_ostr);
|
|
}
|
|
aPOStream.close();
|
|
}
|
|
|
|
/**
 * Emits a single PO entry for group rID through common::writePoEntry().
 *
 * @param aPOStream     stream the entry is written to
 * @param rText_inout   texts collected for the group; "x-comment" is passed
 *                      along when present (an empty string otherwise) and
 *                      "en-US" is passed as the text. Looking up "en-US"
 *                      creates an empty entry if the key is missing.
 * @param rActFileName  name of the source file the entry originates from
 * @param rID           group id of the entry
 */
void LngParser::WritePO(PoOfstream &aPOStream,
    OStringHashMap &rText_inout, const OString &rActFileName,
    const OString &rID)
{
    // Copy the comment first: the "en-US" lookup below may insert into the map.
    const auto itComment = rText_inout.find("x-comment"_ostr);
    const OString aComment
        = (itComment != rText_inout.end()) ? itComment->second : OString();

    const OString &rSourceText = rText_inout["en-US"_ostr];

    common::writePoEntry(
        "Ulfex"_ostr, aPOStream, rActFileName, "LngText",
        rID, OString(), aComment, rSourceText);
}
|
|
|
|
/**
 * Trims sLine_in and checks whether the result is a "[group]" header.
 *
 * @param sGroup_out  receives the group name when a header is found
 * @param sLine_in    raw line, surrounding whitespace allowed
 * @return true when the line is a group header
 */
bool LngParser::isNextGroup(OString &sGroup_out, std::string_view sLine_in)
{
    const std::string_view aStripped = o3tl::trim(sLine_in);
    return lcl_isNextGroup(sGroup_out, aStripped);
}
|
|
|
|
void LngParser::ReadLine(std::string_view rLine_in,
|
|
OStringHashMap &rText_inout)
|
|
{
|
|
if (!o3tl::starts_with(rLine_in, " *") && !o3tl::starts_with(rLine_in, "/*"))
|
|
{
|
|
OString sLang(o3tl::trim(o3tl::getToken(rLine_in, 0, '=')));
|
|
if (!sLang.isEmpty()) {
|
|
rText_inout[sLang] = OString(o3tl::getToken(rLine_in, 1, '"'));
|
|
}
|
|
}
|
|
}
|
|
|
|
void LngParser::Merge(
|
|
const OString &rPOFile,
|
|
const OString &rDestinationFile,
|
|
std::string_view rLanguage )
|
|
{
|
|
std::ofstream aDestination(
|
|
rDestinationFile.getStr(), std::ios_base::out | std::ios_base::trunc);
|
|
|
|
MergeDataFile aMergeDataFile( rPOFile, sSource, false, true );
|
|
if( o3tl::equalsIgnoreAsciiCase(rLanguage, "ALL") )
|
|
aLanguages = aMergeDataFile.GetLanguages();
|
|
|
|
size_t nPos = 0;
|
|
bool bGroup = false;
|
|
OString sGroup;
|
|
|
|
// seek to next group
|
|
while ( nPos < mvLines.size() && !bGroup )
|
|
bGroup = lcl_isNextGroup(sGroup, o3tl::trim(mvLines[nPos++]));
|
|
|
|
while ( nPos < mvLines.size()) {
|
|
OStringHashMap Text;
|
|
OString sID( sGroup );
|
|
std::size_t nLastLangPos = 0;
|
|
|
|
ResData aResData( sID, sSource );
|
|
aResData.sResTyp = "LngText"_ostr;
|
|
MergeEntrys *pEntrys = aMergeDataFile.GetMergeEntrys( &aResData );
|
|
// read languages
|
|
bGroup = false;
|
|
|
|
OString sLanguagesDone;
|
|
|
|
while ( nPos < mvLines.size() && !bGroup )
|
|
{
|
|
const OString sLine{ mvLines[nPos].trim() };
|
|
if ( lcl_isNextGroup(sGroup, sLine) )
|
|
{
|
|
bGroup = true;
|
|
nPos ++;
|
|
sLanguagesDone = ""_ostr;
|
|
}
|
|
else
|
|
{
|
|
sal_Int32 n = 0;
|
|
OString sLang(sLine.getToken(0, '=', n));
|
|
if (n == -1 || static_cast<bool>(sLine.match("/*")))
|
|
{
|
|
++nPos;
|
|
}
|
|
else
|
|
{
|
|
sLang = sLang.trim();
|
|
|
|
OString sSearch{ ";" + sLang + ";" };
|
|
|
|
if ( sLanguagesDone.indexOf( sSearch ) != -1 ) {
|
|
mvLines.erase( mvLines.begin() + nPos );
|
|
}
|
|
if( pEntrys )
|
|
{
|
|
if( !sLang.isEmpty() )
|
|
{
|
|
OString sNewText;
|
|
pEntrys->GetText( sNewText, sLang, true );
|
|
if( sLang == "qtz" )
|
|
continue;
|
|
|
|
if ( !sNewText.isEmpty()) {
|
|
mvLines[ nPos ] = sLang
|
|
+ " = \""
|
|
// escape quotes, unescape double escaped quotes fdo#56648
|
|
+ sNewText.replaceAll("\""_ostr,"\\\""_ostr).replaceAll("\\\\\""_ostr,"\\\""_ostr)
|
|
+ "\"";
|
|
Text[ sLang ] = sNewText;
|
|
}
|
|
}
|
|
nLastLangPos = nPos;
|
|
nPos ++;
|
|
sLanguagesDone += sSearch;
|
|
}
|
|
else {
|
|
nLastLangPos = nPos;
|
|
nPos ++;
|
|
sLanguagesDone += sSearch;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
OString sCur;
|
|
if ( nLastLangPos )
|
|
{
|
|
for(size_t n = 0; n < aLanguages.size(); ++n)
|
|
{
|
|
sCur = aLanguages[ n ];
|
|
if( !sCur.equalsIgnoreAsciiCase("en-US") && Text[sCur].isEmpty() && pEntrys )
|
|
{
|
|
|
|
OString sNewText;
|
|
pEntrys->GetText( sNewText, sCur, true );
|
|
if( sCur == "qtz" )
|
|
continue;
|
|
if ( !sNewText.isEmpty() && sCur != "x-comment")
|
|
{
|
|
const OString sLine { sCur
|
|
+ " = \""
|
|
// escape quotes, unescape double escaped quotes fdo#56648
|
|
+ sNewText.replaceAll("\""_ostr,"\\\""_ostr).replaceAll("\\\\\""_ostr,"\\\""_ostr)
|
|
+ "\"" };
|
|
|
|
nLastLangPos++;
|
|
nPos++;
|
|
|
|
if ( nLastLangPos < mvLines.size() ) {
|
|
mvLines.insert( mvLines.begin() + nLastLangPos, sLine );
|
|
} else {
|
|
mvLines.push_back( sLine );
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
for ( size_t i = 0; i < mvLines.size(); ++i )
|
|
aDestination << mvLines[i] << '\n';
|
|
|
|
aDestination.close();
|
|
}
|
|
|
|
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
|