f365b17bf1
jvmaccess, jvmfwk, l10ntools, libreofficekit and linguistic Change-Id: I9d290d1098b25ccb3aee19d2df18c18f4aa65105 Reviewed-on: https://gerrit.libreoffice.org/51495 Reviewed-by: Noel Grandin <noel.grandin@collabora.co.uk> Tested-by: Jenkins <ci@libreoffice.org> Reviewed-by: Julien Nabet <serval2412@yahoo.fr>
93 lines
3.1 KiB
C++
93 lines
3.1 KiB
C++
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
|
/*
|
|
* This file is part of the LibreOffice project.
|
|
*
|
|
* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
*/
|
|
|
|
#include <cerrno>
|
|
#include <iostream>
|
|
#include <fstream>
|
|
#include <string>
|
|
#include <map>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
|
|
static const int MAXLINE = 1024*64;
|
|
|
|
using namespace std;
|
|
|
|
int main(int argc, char *argv[])
|
|
{
|
|
if (argc != 3 || strcmp(argv[1],"-o"))
|
|
{
|
|
cout << "Usage: idxdict -o outputfile < input\n";
|
|
::exit(99);
|
|
}
|
|
// This call improves performance by approx 5x
|
|
std::ios_base::sync_with_stdio(false);
|
|
|
|
const char * outputFile(argv[2]);
|
|
char inputBuffer[MAXLINE];
|
|
multimap<string, size_t> entries;
|
|
multimap<string,size_t>::iterator ret(entries.begin());
|
|
|
|
int line(1);
|
|
cin.getline(inputBuffer, MAXLINE);
|
|
const string encoding(inputBuffer);
|
|
size_t currentOffset(encoding.size()+1);
|
|
while (true)
|
|
{
|
|
// Extract the next word, but not the entry count
|
|
cin.getline(inputBuffer, MAXLINE, '|');
|
|
|
|
if (cin.eof()) break;
|
|
|
|
string word(inputBuffer);
|
|
ret = entries.insert(ret, pair<string, size_t>(word, currentOffset));
|
|
currentOffset += word.size() + 1;
|
|
// Next is the entry count
|
|
cin.getline(inputBuffer, MAXLINE);
|
|
if (!cin.good())
|
|
{
|
|
cerr << "Unable to read entry - insufficient buffer?.\n";
|
|
exit(99);
|
|
}
|
|
currentOffset += strlen(inputBuffer)+1;
|
|
char * endptr;
|
|
errno = 0;
|
|
int entryCount(strtol(inputBuffer, &endptr, 10));
|
|
if (errno != 0 || endptr == inputBuffer || *endptr != '\0')
|
|
{
|
|
cerr
|
|
<< "Unable to read count from \"" << inputBuffer
|
|
<< "\" input.\n";
|
|
exit(99);
|
|
}
|
|
for (int i(0); i < entryCount; ++i)
|
|
{
|
|
cin.getline(inputBuffer, MAXLINE);
|
|
currentOffset += strlen(inputBuffer)+1;
|
|
++line;
|
|
}
|
|
}
|
|
|
|
// Use binary mode to prevent any translation of LF to CRLF on Windows
|
|
ofstream outputStream(outputFile, ios_base::binary| ios_base::trunc|ios_base::out);
|
|
if (!outputStream.is_open())
|
|
{
|
|
cerr << "Unable to open output file " << outputFile << endl;
|
|
::exit(99);
|
|
}
|
|
|
|
outputStream << encoding << '\n' << entries.size() << '\n';
|
|
|
|
for (auto const& entry : entries)
|
|
{
|
|
outputStream << entry.first << '|' << entry.second << '\n';
|
|
}
|
|
}
|
|
|
|
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
|