mirror of
git://git.savannah.nongnu.org/eliot.git
synced 2025-01-16 03:45:39 +01:00
172 lines
4.8 KiB
C++
172 lines
4.8 KiB
C++
/*****************************************************************************
|
|
* Eliot
|
|
* Copyright (C) 2012 Olivier Teulière
|
|
* Authors: Olivier Teulière <ipkiss @@ gmail.com>
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*****************************************************************************/
|
|
|
|
#include <boost/foreach.hpp>
|
|
#include <boost/format.hpp>
|
|
|
|
#include "csv_helper.h"
|
|
|
|
#include "debug.h"
|
|
|
|
#if ENABLE_NLS
|
|
# include <libintl.h>
|
|
# define _(String) gettext(String)
|
|
#else
|
|
# define _(String) String
|
|
#endif
|
|
|
|
using namespace std;
|
|
|
|
INIT_LOGGER(qt, CsvHelper);
|
|
|
|
|
|
vector<CsvHelper::DataRow> CsvHelper::readStream(istream &input)
|
|
{
|
|
vector<DataRow> data;
|
|
size_t minLength = (size_t) -1;
|
|
size_t maxLength = 0;
|
|
string line;
|
|
string currField;
|
|
// XXX: Using getline() prevents from parsing newline chars in fields.
|
|
// But this limitation is not very big, and it makes the code way simpler.
|
|
while (getline(input, line))
|
|
{
|
|
DataRow row;
|
|
// Parse the line
|
|
bool inQuotes = false;
|
|
size_t pos = 0;
|
|
while (pos < line.size())
|
|
{
|
|
char c = line[pos];
|
|
if (c == ',' && !inQuotes)
|
|
{
|
|
// Field separator
|
|
row.push_back(currField);
|
|
currField.clear();
|
|
}
|
|
else if (c == '"')
|
|
{
|
|
if (inQuotes)
|
|
{
|
|
// Is the next char also a quote?
|
|
if (pos + 1 < line.size() && line[pos + 1] == '"')
|
|
{
|
|
// Escaped quote
|
|
currField.push_back(c);
|
|
++pos;
|
|
}
|
|
else
|
|
{
|
|
// End of quotation
|
|
inQuotes = false;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
if (currField.empty())
|
|
{
|
|
// Beginning of quotation
|
|
inQuotes = true;
|
|
}
|
|
else
|
|
{
|
|
// Normal quote in an unquoted field
|
|
currField.push_back(c);
|
|
}
|
|
}
|
|
}
|
|
else if (c != '\r' && c != '\n')
|
|
{
|
|
// Normal char
|
|
currField.push_back(c);
|
|
}
|
|
|
|
// Next char
|
|
++pos;
|
|
}
|
|
|
|
// Add the last field of the line
|
|
row.push_back(currField);
|
|
currField.clear();
|
|
|
|
data.push_back(row);
|
|
|
|
if (minLength > row.size())
|
|
minLength = row.size();
|
|
if (maxLength < row.size())
|
|
maxLength = row.size();
|
|
}
|
|
|
|
// Normalization (to be tolerant to faulty inputs)
|
|
if (minLength != maxLength)
|
|
{
|
|
boost::format fmt(_("Invalid CSV file (variable number of fields, from %1% to %2%)"));
|
|
throw CsvException((fmt % minLength % maxLength).str());
|
|
}
|
|
|
|
return data;
|
|
}
|
|
|
|
|
|
void CsvHelper::writeStream(ostream &output, const vector<DataRow> &iData)
|
|
{
|
|
if (iData.empty())
|
|
return;
|
|
|
|
// Make sure the rows have the same number of fields
|
|
size_t firstLength = iData.front().size();
|
|
BOOST_FOREACH(const DataRow &row, iData)
|
|
{
|
|
if (row.size() != firstLength)
|
|
throw CsvException(_("Invalid CSV data (variable number of fields)"));
|
|
}
|
|
|
|
BOOST_FOREACH(const DataRow &row, iData)
|
|
{
|
|
bool first = true;
|
|
BOOST_FOREACH(const string &field, row)
|
|
{
|
|
// Add the comma
|
|
if (first)
|
|
first = false;
|
|
else
|
|
output << ',';
|
|
|
|
// Needs quoting?
|
|
if (field.find_first_of(",\"\n") == string::npos)
|
|
output << field;
|
|
else
|
|
{
|
|
output << '"';
|
|
BOOST_FOREACH(char c, field)
|
|
{
|
|
output << c;
|
|
// Double the quote
|
|
if (c == '"')
|
|
output << '"';
|
|
}
|
|
output << '"';
|
|
}
|
|
}
|
|
// End of the row (CR + LF)
|
|
output << "\r\n";
|
|
}
|
|
}
|
|
|