~ubuntu-branches/ubuntu/wily/vowpal-wabbit/wily

Committer: Bazaar Package Importer
Author(s): Yaroslav Halchenko
Date: 2010-12-05 09:50:55 UTC
mfrom: (1.1.1 upstream)
Revision ID: james.westby@ubuntu.com-20101205095055-o8f7gb0kg145tmst

Tags: 5.0-1

* New upstream release
* DEP-5 copyright file
* Boosted policy to 3.9.1 -- removed reference to BSD-3 file from copyright
* Explicitly build vw.1 target

files added:
active_interactor.cc

cg.cc

cg.h

lda.cc

lda.h

test/RunTests

test/pred-sets

test/pred-sets/ref

test/pred-sets/ref/0001.predict

test/test-sets

test/test-sets/0001.dat

test/test-sets/ref

test/test-sets/ref/0001.stderr

test/test-sets/ref/0001.stdout

test/train-sets

test/train-sets/0001.dat

test/train-sets/0002.dat

test/train-sets/ref

test/train-sets/ref/0001.stderr

test/train-sets/ref/0001.stdout

test/train-sets/ref/0002.stderr

test/train-sets/ref/0002.stdout

test/train-sets/ref/0002a.stderr

test/train-sets/ref/0002a.stdout

utl/vw-convergence

files removed:
.pc

.pc/.version

.pc/applied-patches

.pc/debian-changes-4.1+20100420-1

.pc/debian-changes-4.1+20100420-1/cluster_command

debian/patches

debian/patches/debian-changes-4.1+20100420-1

debian/patches/series

test/test.dat

test/train.dat

files modified:
.gitignore

Makefile

cache.cc

cluster_command

debian/changelog

debian/control

debian/copyright

debian/rules

delay_ring.cc

delay_ring.h

example.h

gd.cc

gd.h

global_data.cc

global_data.h

loss_functions.cc

loss_functions.h

main.cc

message_relay.cc

message_relay.h

multisource.cc

multisource.h

network.cc

noop.cc

parse_args.cc

parse_args.h

parse_example.cc

parse_example.h

parse_regressor.cc

parse_regressor.h

parser.cc

parser.h

sender.cc

sender.h

simple_label.cc

simple_label.h

sparse_dense.cc

sparse_dense.h

test/README

v_array.h

vw.cc

Show diffs side-by-side

added added

removed removed

loss_functions.cc

using namespace std;

#include "loss_functions.h"

#include "global_data.h"

class squaredloss : public loss_function {

public:

squaredloss() {

}

double getLoss(double prediction, double label) {

double example_loss = (prediction - label) * (prediction - label);

return example_loss;

}

double getUpdate(double prediction, double label) {

return (label - prediction);

}

};

squaredloss() {

}

float getLoss(float prediction, float label) {

float example_loss = (prediction - label) * (prediction - label);

return example_loss;

}

float getUpdate(float prediction, float label,float eta_t, float norm) {

if (eta_t < 1e-6){

/* When exp(-eta_t)~= 1 we replace 1-exp(-eta_t)

* with its first order Taylor expansion around 0

* to avoid catastrophic cancellation.

return (label - prediction)*eta_t/norm;

}

return (label - prediction)*(1-exp(-eta_t))/norm;

}

float getRevertingWeight(float prediction, float eta_t){

float t = 0.5*(global.min_label+global.max_label);

float alternative = (prediction > t) ? global.min_label : global.max_label;

return log((alternative-prediction)/(alternative-t))/eta_t;

}

float getSquareGrad(float prediction, float label) {

return (prediction - label) * (prediction - label);

}

float first_derivative(float prediction, float label)

{

return 2. * (prediction-label);

}

float second_derivative(float prediction, float label)

{

return 2.;

}

};

// Squared-error loss with the plain gradient step: the update is linear
// in eta_t.
class classic_squaredloss : public loss_function {
public:
  classic_squaredloss() {}

  // Returns (prediction - label)^2.
  float getLoss(float prediction, float label) {
    return (prediction - label) * (prediction - label);
  }

  // Returns eta_t * (label - prediction) / norm.
  float getUpdate(float prediction, float label, float eta_t, float norm) {
    float step = eta_t*(label - prediction)/norm;
    return step;
  }

  // Uses the midpoint of [global.min_label, global.max_label] and the label
  // bound on the far side of that midpoint from the prediction.
  // Returns (mid - prediction) / ((far_bound - prediction) * eta_t).
  float getRevertingWeight(float prediction, float eta_t) {
    float mid = 0.5*(global.min_label+global.max_label);
    float far_bound;
    if (prediction > mid) {
      far_bound = global.min_label;
    } else {
      far_bound = global.max_label;
    }
    return (mid-prediction)/((far_bound-prediction)*eta_t);
  }

  // Returns (prediction - label)^2.
  float getSquareGrad(float prediction, float label) {
    float sq = (prediction - label) * (prediction - label);
    return sq;
  }

  // d(loss)/d(prediction) = 2 * (prediction - label).
  float first_derivative(float prediction, float label) {
    return 2. * (prediction-label);
  }

  // Constant second derivative; the arguments are not read.
  float second_derivative(float prediction, float label) {
    return 2.;
  }
};

// Hinge loss: max(0, 1 - label * prediction).
class hingeloss : public loss_function {
public:
  hingeloss() {
  }

  // Returns 1 - label*prediction when that is positive, otherwise 0.
  float getLoss(float prediction, float label) {
    float e = 1 - label*prediction;
    return (e > 0) ? e : 0;
  }

  // Returns 0 when label*prediction >= label*label. That test also covers
  // label == 0, so the division below never sees a zero denominator.
  // Otherwise the step is label * min(s1, eta_t) / norm, where
  // s1 = (label^2 - label*prediction) / label^2.
  float getUpdate(float prediction, float label,float eta_t, float norm) {
    if(label*prediction >= label*label) return 0;
    float s1=(label*label-label*prediction)/(label*label);
    float s2=eta_t;
    return label * (s1<s2 ? s1 : s2)/norm;
  }

  // Returns |prediction| / eta_t.
  float getRevertingWeight(float prediction, float eta_t){
    return fabs(prediction)/eta_t;
  }

  // Square of first_derivative(). The previous code returned the derivative
  // itself (0 or -label), which is negative for positive labels; logloss
  // and quantileloss in this file both return the squared value.
  float getSquareGrad(float prediction, float label) {
    float d = first_derivative(prediction,label);
    return d*d;
  }

  // Returns 0 when label*prediction >= label*label, otherwise -label.
  float first_derivative(float prediction, float label)
  {
    return (label*prediction >= label*label) ? 0 : -label;
  }

  // Always 0; both arguments are unused.
  float second_derivative(float prediction, float label)
  {
    return 0.;
  }
};

126

127

// Logistic loss: log(1 + exp(-label * prediction)).
class logloss : public loss_function {
public:
  logloss() {
  }

  // Returns log(1 + exp(-label * prediction)).
  float getLoss(float prediction, float label) {
    return log(1 + exp(-label * prediction));
  }

  // For eta_t below 1e-6, returns label*eta_t / ((1+d)*norm) with
  // d = exp(label*prediction). Otherwise returns
  // -(label*w + prediction)/norm with
  // w = wexpmx(eta_t + label*prediction + d).
  // NOTE(review): d is a float, so exp() overflows once label*prediction
  // exceeds roughly 88; confirm callers keep the product below that.
  float getUpdate(float prediction, float label, float eta_t, float norm) {
    float w,x;
    float d = exp(label * prediction);
    if(eta_t < 1e-6){
      /* As with squared loss, for small eta_t we replace the update
       * with its first order Taylor expansion to avoid numerical problems
       */
      return label*eta_t/((1+d)*norm);
    }
    x = eta_t + label*prediction + d;
    w = wexpmx(x);
    return -(label*w+prediction)/norm;
  }

  // Approximates W(exp(x)) - x; see the comment in the body.
  inline float wexpmx(float x){
    /* This piece of code is approximating W(exp(x))-x.
     * W is the Lambert W function: W(z)*exp(W(z))=z.
     * The absolute error of this approximation is less than 9e-5.
     * Faster/better approximations can be substituted here.
     */
    double w = x>=1. ? 0.86*x+0.01 : exp(0.8*x-0.65); //initial guess
    double r = x>=1. ? x-log(w)-w : 0.2*x+0.65-w; //residual
    double t = 1.+w;
    double u = 2.*t*(t+2.*r/3.); //magic
    return w*(1.+r/t*(u-r)/(u-2.*r))-x; //more magic
  }

  // With z = -|prediction|, returns (1 - z - exp(z)) / eta_t.
  float getRevertingWeight(float prediction, float eta_t){
    float z = -fabs(prediction);
    return (1-z-exp(z))/eta_t;
  }

  // d(loss)/d(prediction) = -label / (1 + exp(label * prediction)).
  float first_derivative(float prediction, float label)
  {
    float v = - label/(1+exp(label * prediction));
    return v;
  }

  // Square of first_derivative().
  float getSquareGrad(float prediction, float label) {
    float d = first_derivative(prediction,label);
    return d*d;
  }

  // Returns label^2 * e / (1+e)^2 with e = exp(label * prediction).
  float second_derivative(float prediction, float label)
  {
    float e = exp(label*prediction);

    return label*label*e/((1+e)*(1+e));
  }
};

187

188

class quantileloss : public loss_function {

189

public:

quantileloss(double &tau_) : tau(tau_) {

}

double getLoss(double prediction, double label) {

double e = label - prediction;

if(e > 0) {

return tau * e;

} else {

return -(1 - tau) * e;

}

double getUpdate(double prediction, double label) {

double e = label - prediction;

if(e == 0) return 0;

if(e > 0) {

return tau;

} else {

return -(1 - tau);

}

double tau;

190

quantileloss(double &tau_) : tau(tau_) {

191

}

192

193

float getLoss(float prediction, float label) {

194

float e = label - prediction;

195

if(e > 0) {

196

return tau * e;

197

} else {

198

return -(1 - tau) * e;

199

}

200

201

}

202

203

float getUpdate(float prediction, float label, float eta_t, float norm) {

204

float s2;

205

float e = label - prediction;

206

if(e == 0) return 0;

207

float s1=eta_t;

208

if(e > 0) {

209

s2=e/tau;

210

return tau*(s1<s2?s1:s2)/norm;

211

} else {

212

s2=-e/(1-tau);

213

return -(1 - tau)*(s1<s2?s1:s2)/norm;

214

}

215

}

216

217

float getRevertingWeight(float prediction, float eta_t){

218

float v,t;

219

t = 0.5*(global.min_label+global.max_label);

220

if(prediction > t)

221

v = -(1-tau);

222

else

223

v = tau;

224

return (t - prediction)/(eta_t*v);

225

}

226

227

float first_derivative(float prediction, float label)

228

{

229

float e = label - prediction;

230

if(e == 0) return 0;

231

return e > 0 ? -tau : (1-tau);

232

}

233

234

float getSquareGrad(float prediction, float label) {

235

float fd = first_derivative(prediction,label);

236

return fd*fd;

237

}

238

239

float second_derivative(float prediction, float label)

240

{

241

return 0.;

242

}

243

244

double tau;

245

};

246

247

// Builds the loss function selected by funcName and returns it as a raw
// pointer obtained from `new`.
//
// Recognised names: "squared", "classic", "hinge", "logistic", and
// "quantile" / "pinball" / "absolute" (all three build a quantileloss from
// function_parameter). Selecting "logistic" also sets global.min_label and
// global.max_label to -100 and 100.
//
// Any other name prints a message to stdout and terminates the process
// with exit(1), so the function never returns without a value.
loss_function* getLossFunction(string funcName, double function_parameter) {
  if(funcName.compare("squared") == 0) {
    return new squaredloss();
  } else if(funcName.compare("classic") == 0){
    return new classic_squaredloss();
  } else if(funcName.compare("hinge") == 0) {
    return new hingeloss();
  } else if(funcName.compare("logistic") == 0) {
    global.min_label = -100;
    global.max_label = 100;
    return new logloss();
  } else if(funcName.compare("quantile") == 0 || funcName.compare("pinball") == 0 || funcName.compare("absolute") == 0) {
    return new quantileloss(function_parameter);
  }

  // Every recognised name has returned above; anything else is fatal.
  cout << "Invalid loss function name: \'" << funcName << "\' Bailing!" << endl;
  exit(1);
}

Older »