summaryrefslogtreecommitdiff
path: root/tools/fileDataProvider.h
blob: 972a4c5b1a76d658666d670b00df06ae35925cc8 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
#ifndef FDPROV_H
#define FDPROV_H

#include "dataProvider.h"
#include "easylogging++.h"
#include <string>
#include <iostream>
#include <fstream>

// FileDP: presumably parses records laid out as "rank qid features" (TODO: confirm against getDataSet).

// DataProvider backed by a single input file whose path is fixed at
// construction time.
class FileDP : public DataProvider
{
public:
    // fn: path of the file to read; defaults to the empty string.
    FileDP(std::string fn = "") : fname(fn) {}

    // Declared here, defined out of line.
    virtual int getDataSet(DataList &out);

    // Not supported by this provider: `out` is left untouched and a message
    // is logged at FATAL level instead.
    virtual void getAllDataSet(RidList &out)
    {
        LOG(FATAL) << "getAllDataSet for normal FileDP not implemented";
    }

    // Opens the stream on `fname` and resets `eof` (not declared in this
    // class; presumably inherited from DataProvider).
    // Always returns 0: the outcome of the open itself is not checked.
    virtual int open()
    {
        fin.open(fname);
        eof = false;
        return 0;
    }

    // Closes the stream. Always returns 0.
    virtual int close()
    {
        fin.close();
        return 0;
    }

private:
    std::string fname;  // path handed to fin.open()
    std::ifstream fin;  // stream opened by open() and closed by close()
};

// RidFileDP: presumably parses records laid out as "label features" (TODO: confirm against readEntries).

// DataProvider backed by a single input file that keeps its entries in an
// in-memory DataList (`d`). The accessors defined in this header call
// readEntries() on demand, the first time they run with `read` still false.
class RidFileDP:public DataProvider
{
private:
    std::string fname;  // path handed to fin.open()
    std::ifstream fin;  // stream opened by open() and closed by close()
    DataList d;         // entries held by this provider; emptied by close()
    bool read;          // false until the entries are loaded (presumably set by readEntries())
    int pos;            // not used in this header; maintained by out-of-line members
    int qid;            // not used in this header; maintained by out-of-line members
public:
    // fn: path of the file to read; defaults to the empty string.
    // Every scalar member is given a defined value so that no member function
    // can observe an indeterminate `pos` or `qid`.
    RidFileDP(std::string fn=""):fname(fn),read(false),pos(0),qid(0){}

    // Declared here, defined out of line.
    void readEntries();

    // Returns d.getfSize(), calling readEntries() first if `read` is false.
    int getfSize() { if(!read) readEntries(); return d.getfSize();}

    // Declared here, defined out of line.
    int getpSize();
    void shuffle(std::vector<DataEntry*> &dat);
    virtual void getAllDataSet(RidList &out);
    virtual int getDataSet(DataList &out);

    // Opens the stream on `fname` and resets `eof` (not declared in this
    // class; presumably inherited from DataProvider).
    // Always returns 0: the outcome of the open itself is not checked.
    virtual int open(){fin.open(fname); eof=false;return 0;}

    // Closes the stream and empties `d`. Always returns 0.
    // NOTE(review): `read` is left unchanged, so after close() the accessors
    // below will not call readEntries() again -- confirm this is intended.
    virtual int close(){fin.close(); d.clear();return 0;}

    // Declared here, defined out of line.
    void take(int n,std::vector<DataEntry*> &a,std::vector<DataEntry*> &b);

    // Replaces the contents of `rid` with the entry pointers currently held
    // in `d`, calling readEntries() first if `read` is false. Only the
    // pointers are copied; the DataEntry objects themselves are not.
    void getRidVector(std::vector<DataEntry*> &rid){
        if (!read)
            readEntries();
        rid.clear();
        std::vector<DataEntry*> &dat = d.getData();
        // Grow once up front instead of reallocating while appending.
        rid.reserve(dat.size());
        // Range-for avoids comparing a signed index against the unsigned size().
        for (DataEntry *entry : dat)
            rid.push_back(entry);
    }
};

#endif