|
1 | 1 | #include "ggml.h"
|
2 | 2 | #include <vector>
|
3 |
| -#include <assert.h> |
| 3 | +#include <cassert> |
4 | 4 | #include <random>
|
5 |
| -#include <string.h> |
6 |
| - |
7 |
| -#undef MIN |
8 |
| -#undef MAX |
9 |
| -#define MIN(a, b) ((a) < (b) ? (a) : (b)) |
10 |
| -#define MAX(a, b) ((a) > (b) ? (a) : (b)) |
| 5 | +#include <cstring> |
11 | 6 |
|
12 | 7 | float frand() {
|
13 | 8 | return (float)rand()/(float)RAND_MAX;
|
@@ -1068,7 +1063,7 @@ void get_example_targets(int example_id, struct ggml_tensor * tokens_input, stru
|
1068 | 1063 | float z = (y+1.0f)*0.5f; // scale to [0..1]
|
1069 | 1064 | z += (frand()-0.5f)*(randomness/n_vocab);
|
1070 | 1065 | z = (z < 0.0f) ? 0.0f : (z > 1.0f) ? 1.0f : z; // clamp to [0..1]
|
1071 |
| - int token = MAX(1,MIN(1+(int)(z*(float)(n_vocab-1)), n_vocab-1)); |
| 1066 | + int token = std::max(1,std::min(1+(int)(z*(float)(n_vocab-1)), n_vocab-1)); |
1072 | 1067 | ggml_set_f32_1d(targets, (i-1)*n_vocab + token, +1.0f);
|
1073 | 1068 | if (i<n_tokens) {
|
1074 | 1069 | ggml_set_i32_1d(tokens_input, i, token);
|
@@ -1119,7 +1114,7 @@ int main(int argc, char ** argv) {
|
1119 | 1114 | model.hparams.n_mult = 2;
|
1120 | 1115 | model.hparams.n_head = 8;
|
1121 | 1116 | model.hparams.n_layer = 1;
|
1122 |
| - model.hparams.n_rot = MIN(16, model.hparams.n_embd / model.hparams.n_head); |
| 1117 | + model.hparams.n_rot = std::min(16u, model.hparams.n_embd / model.hparams.n_head); |
1123 | 1118 |
|
1124 | 1119 | // model.hparams.n_embd = 32;
|
1125 | 1120 | // model.hparams.n_mult = 2;
|
@@ -1225,12 +1220,12 @@ int main(int argc, char ** argv) {
|
1225 | 1220 | // struct ggml_tensor * e = cross_entropy_loss(ctx0, targets1, logits1);
|
1226 | 1221 | // struct ggml_tensor * e = square_error_loss(ctx0, targets1, logits1);
|
1227 | 1222 |
|
1228 |
| - // struct ggml_tensor * e = ggml_add(ctx0, |
1229 |
| - // square_error_loss(ctx0, targets1, logits1), |
1230 |
| - // square_error_loss(ctx0, targets2, logits2)); |
1231 | 1223 | struct ggml_tensor * e = ggml_add(ctx0,
|
1232 |
| - cross_entropy_loss(ctx0, targets1, logits1), |
1233 |
| - cross_entropy_loss(ctx0, targets2, logits2)); |
| 1224 | + square_error_loss(ctx0, targets1, logits1), |
| 1225 | + square_error_loss(ctx0, targets2, logits2)); |
| 1226 | + // struct ggml_tensor * e = ggml_add(ctx0, |
| 1227 | + // cross_entropy_loss(ctx0, targets1, logits1), |
| 1228 | + // cross_entropy_loss(ctx0, targets2, logits2)); |
1234 | 1229 | // struct ggml_tensor * e = ggml_add(ctx0,
|
1235 | 1230 | // ggml_add(ctx0,
|
1236 | 1231 | // cross_entropy_loss(ctx0, targets1, logits1),
|
|
0 commit comments