forked from taku910/crfpp
-
Notifications
You must be signed in to change notification settings - Fork 11
/
Copy pathlbfgs.h
114 lines (100 loc) · 2.93 KB
/
lbfgs.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
//
// CRF++ -- Yet Another CRF toolkit
//
// $Id: lbfgs.h 1588 2007-02-12 09:03:39Z taku $;
//
// Copyright(C) 2005-2007 Taku Kudo <taku@chasen.org>
//
#ifndef CRFPP_LBFGS_H_
#define CRFPP_LBFGS_H_
#include <cmath>
#include <vector>
#include <iostream>
namespace CRFPP {
class LBFGS {
private:
class Mcsrch;
int iflag_, iscn, nfev, iycn, point, npt;
int iter, info, ispt, isyt, iypt, maxfev;
double stp, stp1;
std::vector <double> diag_;
std::vector <double> w_;
std::vector <double> v_;
std::vector <double> xi_;
Mcsrch *mcsrch_;
void pseudo_gradient(int size,
double *v,
double *x,
const double *g,
double C);
void lbfgs_optimize(int size,
int msize,
double *x,
double f,
const double *g,
double *diag,
double *w, bool orthant,
double C, double *v, double *xi, int *iflag);
public:
explicit LBFGS(): iflag_(0), iscn(0), nfev(0), iycn(0),
point(0), npt(0), iter(0), info(0),
ispt(0), isyt(0), iypt(0), maxfev(0),
stp(0.0), stp1(0.0), mcsrch_(0) {}
virtual ~LBFGS() { clear(); }
void clear();
// This is old interface for backward compatibility
// ignore msize |m|
int init(int n, int m) {
static const int msize = 5;
const size_t size = n;
iflag_ = 0;
w_.resize(size * (2 * msize + 1) + 2 * msize);
diag_.resize(size);
v_.resize(size);
return 0;
}
// old interface
int optimize(double *x, double *f, double *g) {
return optimize(diag_.size(), x, *f, g, false, 1.0);
}
// Use this interface
int optimize(size_t size, double *x, double f,
double *g, bool orthant, double C) {
static const int msize = 5;
if (w_.empty()) {
iflag_ = 0;
w_.resize(size * (2 * msize + 1) + 2 * msize);
diag_.resize(size);
v_.resize(size);
if (orthant) {
xi_.resize(size);
}
} else if (diag_.size() != size || v_.size() != size) {
std::cerr << "size of array is different" << std::endl;
return -1;
} else if (orthant && v_.size() != size) {
std::cerr << "size of array is different" << std::endl;
return -1;
}
if (orthant) {
lbfgs_optimize(static_cast<int>(size),
msize, x, f, g, &diag_[0], &w_[0], orthant,
C, &v_[0], &xi_[0], &iflag_);
} else {
lbfgs_optimize(static_cast<int>(size),
msize, x, f, g, &diag_[0], &w_[0], orthant,
C, g, &xi_[0], &iflag_);
}
if (iflag_ < 0) {
std::cerr << "routine stops with unexpected error" << std::endl;
return -1;
}
if (iflag_ == 0) {
clear();
return 0; // terminate
}
return 1; // evaluate next f and g
}
};
}
#endif