00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013
00014
00015
00016
00017
00018
00019
00020
00021
00022
00023
00024
00025
00026
00027
00028
00029
00030
00031
00032
00033
00034
00035
00036
00037
00038
00039
00040
00041
00042
00043
#include "CrossEntropyVariable.h"
00044
00045
namespace PLearn {
00046
using namespace std;
00047
00048
00049
00052
// Registers CrossEntropyVariable with the PLearn object system.
// NOTE(review): the two string arguments look like the one-line description
// and the extended help text -- confirm against the macro definition.
PLEARN_IMPLEMENT_OBJECT(
    CrossEntropyVariable,
    "cost = - sum_i {target_i * log(output_i) + (1-target_i) * log(1-output_i)}",
    "NO HELP");
00055
00056 CrossEntropyVariable::CrossEntropyVariable(
Variable* netout,
Variable* target)
00057 :
inherited(netout,target,1,1)
00058 {
00059
build_();
00060 }
00061
00062
void
00063 CrossEntropyVariable::build()
00064 {
00065 inherited::build();
00066
build_();
00067 }
00068
00069
void
00070 CrossEntropyVariable::build_()
00071 {
00072
00073
if (input1 && input2 && (input1->size() != input2->size()))
00074
PLERROR(
"In CrossEntropyVariable: netout and target must have the same size");
00075 }
00076
00077
00078 void CrossEntropyVariable::recomputeSize(
int& l,
int& w)
const
00079
{ l=1, w=1; }
00080
00081
00082 void CrossEntropyVariable::fprop()
00083 {
00084
real cost = 0.0;
00085
for (
int i=0; i<input1->size(); i++)
00086 {
00087
real output = input1->valuedata[i];
00088
real target = input2->valuedata[i];
00089
if ((output == 0.0 && target != 0) || (output == 1.0 && target != 1))
00090
PLERROR(
"CrossEntropyVariable::fprop: model output is either exactly "
00091
"0.0 or 1.0; cannot compute cost function");
00092
if (output != 0 && output != 1) {
00093 cost += target*
log(output) + (1.0-target)*
log(1.0-output);
00094 }
00095 }
00096 valuedata[0] = -cost;
00097 }
00098
00099
00100 void CrossEntropyVariable::bprop()
00101 {
00102
real gr = *gradientdata;
00103
for (
int i=0; i<input1->size(); i++)
00104 {
00105
real output = input1->valuedata[i];
00106
real target = input2->valuedata[i];
00107
#ifdef BOUNDCHECK
00108
if (output == target)
00109
PLERROR(
"CrossEntropyVariable::bprop: model output is either exactly "
00110
"0.0 or 1.0; cannot compute bprop");
00111
#endif
00112
input1->gradientdata[i] += gr*(-target/output + (1.0-target)/(1.0-output));
00113 }
00114 }
00115
00116
00117 }
00118
00119