95 map<size_t, col_t> columns;
98 for (
auto it=cols.begin(); it!=cols.end(); it++)
102 c.offset = it->second.offset;
103 c.size = it->second.size;
104 c.num = it->second.num;
106 c.ptr = f.SetPtrAddress(it->first);
108 columns[c.offset] = c;
110 row_tot += c.size*c.num;
116 header.resize(f.tellg());
119 f.read((
char*)header.c_str(), header.size());
125 const size_t hlen = 0;
127 size_t hs = header.size();
130 fout.write((
char*)&hlen,
sizeof(
size_t));
131 fout.write((
char*)&hs,
sizeof(
size_t));
132 fout.write(header.c_str(), header.size());
134 tot += header.size();
135 com += header.size()+2+2*
sizeof(size_t);
142 vector<char> cache(row_tot);
143 while (f.GetNextRow())
146 char *out = cache.data();
149 vector<uint8_t> mask(cols.size()/8 + 1);
153 for (
auto it=columns.begin(); it!=columns.end(); it++, icol++)
156 const size_t len_col = it->second.size * it->second.num;
159 int16_t *ptr = (int16_t*)it->second.ptr;
178 if (len_col>32 && it->second.size==2)
190 if (buf.size()<len_col)
193 memcpy(out, buf.c_str(), buf.size());
197 const uint64_t bit = (icol%8);
198 mask[icol/8] |= (1<<bit);
205 memcpy(out, (
char*)ptr, len_col);
210 const size_t sz = out-cache.data();
214 com += sz + mask.size();
217 fout.write((
char*)mask.data(), mask.size());
218 fout.write(cache.data(), sz);
223 const float proc = float(f.GetRow())/f.GetNumRows();
227 cout <<
"\r" << setprecision(0) << setw(3) << 100*proc <<
"% [" << setprecision(1) << setw(5) << 100.*com/tot <<
"%] cpu:" << sec <<
"s in:" << tot/1000000/elep <<
"MB/s" << flush;
233 cout << setprecision(0) <<
"\r100% [" << setprecision(1) << setw(5) << 100.*com/tot <<
"%] cpu:" << sec <<
"s in:" << tot/1000000/elep <<
"MB/s" << endl;
std::map< std::string, Column > Columns
Adds some functionality to boost::posix_time::ptime for our needs.
bool Encode(std::string &bufout, const uint16_t *bufin, size_t bufinlen)