// Source listing metadata: 65 lines, 1.8 KiB, C++.
#ifndef PARQUET_CURSOR_H
|
|
#define PARQUET_CURSOR_H
|
|
|
|
#include "parquet_filter.h"
|
|
#include "parquet_table.h"
|
|
#include "parquet/api/reader.h"
|
|
|
|
class ParquetCursor {
|
|
|
|
ParquetTable* table;
|
|
std::unique_ptr<parquet::ParquetFileReader> reader;
|
|
std::unique_ptr<parquet::RowGroupMetaData> rowGroupMetadata;
|
|
std::shared_ptr<parquet::RowGroupReader> rowGroup;
|
|
std::vector<std::shared_ptr<parquet::Scanner>> scanners;
|
|
std::vector<parquet::Type::type> types;
|
|
std::vector<parquet::LogicalType::type> logicalTypes;
|
|
|
|
std::vector<int> colRows;
|
|
std::vector<bool> colNulls;
|
|
std::vector<int64_t> colIntValues;
|
|
std::vector<double> colDoubleValues;
|
|
std::vector<parquet::ByteArray> colByteArrayValues;
|
|
|
|
int rowId;
|
|
int rowGroupId;
|
|
int rowGroupStartRowId;
|
|
int rowGroupSize;
|
|
int numRows;
|
|
int numRowGroups;
|
|
int rowsLeftInRowGroup;
|
|
|
|
bool nextRowGroup();
|
|
|
|
std::vector<Constraint> constraints;
|
|
|
|
bool currentRowSatisfiesFilter();
|
|
bool currentRowGroupSatisfiesFilter();
|
|
bool currentRowGroupSatisfiesRowIdFilter(Constraint constraint);
|
|
bool currentRowGroupSatisfiesTextFilter(Constraint constraint, std::shared_ptr<parquet::RowGroupStatistics> stats);
|
|
bool currentRowGroupSatisfiesIntegerFilter(Constraint constraint, std::shared_ptr<parquet::RowGroupStatistics> stats);
|
|
bool currentRowGroupSatisfiesDoubleFilter(Constraint constraint, std::shared_ptr<parquet::RowGroupStatistics> stats);
|
|
|
|
public:
|
|
ParquetCursor(ParquetTable* table);
|
|
int getRowId();
|
|
void next();
|
|
void close();
|
|
void reset(std::vector<Constraint> constraints);
|
|
bool eof();
|
|
|
|
void ensureColumn(int col);
|
|
bool isNull(int col);
|
|
parquet::Type::type getPhysicalType(int col);
|
|
parquet::LogicalType::type getLogicalType(int col);
|
|
ParquetTable* getTable();
|
|
|
|
int getInt32(int col);
|
|
long getInt64(int col);
|
|
double getDouble(int col);
|
|
parquet::ByteArray* getByteArray(int col);
|
|
};
|
|
|
|
#endif
|
|
|