|
28 | 28 | #ifndef STD_CONF_H |
29 | 29 | #define STD_CONF_H |
30 | 30 |
|
31 | | -#define NEURONS 128 |
| 31 | +#define NEURONS 128 |
32 | 32 |
|
33 | | -#define STD_LEARNING_RATE 0.001 |
34 | | -#define STD_MOMENTUM 0.0 |
35 | | -#define STD_LAMBDA 0.05 |
36 | | -#define SOFTMAX_TEMP 1.0 |
37 | | -#define GRADIENT_CLIP_LIMIT 5.0 |
38 | | -#define MINI_BATCH_SIZE 100 |
39 | | -#define LOSS_MOVING_AVG 0.01 |
| 33 | +#define STD_LEARNING_RATE 0.001 |
| 34 | +#define STD_MOMENTUM 0.0 |
| 35 | +#define STD_LAMBDA 0.05 |
| 36 | +#define SOFTMAX_TEMP 1.0 |
| 37 | +#define GRADIENT_CLIP_LIMIT 5.0 |
| 38 | +#define MINI_BATCH_SIZE 100 |
| 39 | +#define LOSS_MOVING_AVG 0.01 |
40 | 40 |
|
41 | | -#define LAYERS 3 |
| 41 | +#define LAYERS 3 // Has a tremendous impact on available memory |
42 | 42 |
|
43 | | -#define STATEFUL 1 |
| 43 | +#define STATEFUL 1 |
44 | 44 |
|
45 | | -#define GRADIENTS_CLIP 1 |
46 | | -#define GRADIENTS_FIT 0 |
| 45 | +#define GRADIENTS_CLIP 1 |
| 46 | +#define GRADIENTS_FIT 0 |
47 | 47 |
|
48 | | -#define MODEL_REGULARIZE 0 |
| 48 | +#define MODEL_REGULARIZE 0 |
49 | 49 |
|
50 | | -#define DECREASE_LR 0 // set to 0 to disable decreasing learning rate |
| 50 | +#define DECREASE_LR 0 // set to 0 to disable decreasing learning rate |
51 | 51 |
|
52 | | -#define STD_LEARNING_RATE_DECREASE 100000 |
53 | | -#define STD_NUMBER_OF_NO_RECORD_ITERATIONS_UNTIL_LR_DECREASE 1000000 |
| 52 | +#define STD_LEARNING_RATE_DECREASE 100000 |
| 53 | +#define STD_NUMBER_OF_NO_RECORD_ITERATIONS_UNTIL_LR_DECREASE 1000000 |
54 | 54 |
|
55 | 55 | /* |
56 | 56 | * These defines modify how the program interacts with the user |
57 | 57 | * of the program during the training phase. Here you can |
58 | 58 | * decide how often it should output its progress and whether or not |
59 | 59 | * it should write to file among other things. |
60 | 60 | */ |
61 | | -#define PRINT_EVERY_X_ITERATIONS 100 |
62 | | -#define STORE_EVERY_X_ITERATIONS 8000 |
63 | | -#define PRINT_PROGRESS 1 // set to 0 to disable printing |
64 | | -#define PRINT_SAMPLE_OUTPUT 1 // set to 0 to disable output sampling |
65 | | -#define PRINT_SAMPLE_OUTPUT_TO_FILE 0 // set to 0 to disable output sampling to file |
66 | | -#define PRINT_SAMPLE_OUTPUT_TO_FILE_ARG "a" // used as an argument to fopen (goes with "w" or "a") |
67 | | -#define PRINT_SAMPLE_OUTPUT_TO_FILE_NAME "progress_output.txt" // name of the file containing samples |
68 | | -#define STORE_PROGRESS_EVERY_X_ITERATIONS 1000 // set to 0 to disable writing loss value to file during training |
69 | | -#define PROGRESS_FILE_NAME "progress.csv" |
70 | | -#define NUMBER_OF_CHARS_TO_DISPLAY_DURING_TRAINING 200 |
| 61 | +#define PRINT_EVERY_X_ITERATIONS 100 |
| 62 | +#define STORE_EVERY_X_ITERATIONS 8000 |
| 63 | +#define PRINT_PROGRESS 1 // set to 0 to disable printing |
| 64 | +#define PRINT_SAMPLE_OUTPUT 1 // set to 0 to disable output sampling |
| 65 | +#define PRINT_SAMPLE_OUTPUT_TO_FILE 0 // set to 0 to disable output sampling to file |
| 66 | +#define PRINT_SAMPLE_OUTPUT_TO_FILE_ARG "a" // used as an argument to fopen (goes with "w" or "a") |
| 67 | +#define PRINT_SAMPLE_OUTPUT_TO_FILE_NAME "progress_output.txt" // name of the file containing samples |
| 68 | +#define STORE_PROGRESS_EVERY_X_ITERATIONS 1000 // set to 0 to disable writing loss value to file during training |
| 69 | +#define PROGRESS_FILE_NAME "progress.csv" |
| 70 | +#define NUMBER_OF_CHARS_TO_DISPLAY_DURING_TRAINING 200 |
71 | 71 |
|
72 | 72 | /* |
73 | 73 | * Once the network has been trained it is stored to these files. |
|
77 | 77 | * but not by the interactive HTML application. |
78 | 78 | * For that, the .json file is intended to be used. |
79 | 79 | */ |
80 | | -#define STD_LOADABLE_NET_NAME "lstm_net.net" |
81 | | -#define STD_JSON_NET_NAME "lstm_net.json" |
| 80 | +#define STD_LOADABLE_NET_NAME "lstm_net.net" |
| 81 | +#define STD_JSON_NET_NAME "lstm_net.json" |
82 | 82 |
|
83 | 83 | // ================== DO NOT CHANGE THE FOLLOWING DEFINES ====================== |
84 | 84 | // Don't change this one, else the HTML application will not work. |
85 | | -#define JSON_KEY_NAME_SET "Feature mapping" |
| 85 | +#define JSON_KEY_NAME_SET "Feature mapping" |
86 | 86 | // This define should stay undefined; it was only defined during experimentation |
87 | 87 | // #define INTERLAYER_SIGMOID_ACTIVATION |
88 | 88 | // ============================================================================= |
|
0 commit comments