analistica/ex-7/main.c

111 lines
3.1 KiB
C
Raw Normal View History

2020-03-06 02:24:32 +01:00
#include <errno.h>
#include <limits.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

#include "fisher.h"
#include "percep.h"
2020-03-06 11:54:28 +01:00
/* Command-line options of the program.
 *
 * Filled with defaults at the start of main() and then
 * overridden by the -m, -s, -n and -i flags respectively.
 */
struct options {
  const char *mode;  /* discriminant to use: "fisher" or "percep";
                      * const because the default is a string literal */
  size_t nsig;       /* number of events in the signal class */
  size_t nnoise;     /* number of events in the noise class */
  int iter;          /* number of training iterations (perceptron) */
};
2020-03-06 11:54:28 +01:00
int main(int argc, char **argv) {
/* Set default options */
struct options opts;
opts.mode = "fisher";
opts.nsig = 800;
opts.nnoise = 1000;
2020-03-06 19:46:42 +01:00
opts.iter = 5;
2020-03-06 11:54:28 +01:00
/* Process CLI arguments */
for (size_t i = 1; i < argc; i++) {
if (!strcmp(argv[i], "-m")) opts.mode = argv[++i];
else if (!strcmp(argv[i], "-s")) opts.nsig = atol(argv[++i]);
else if (!strcmp(argv[i], "-n")) opts.nnoise = atol(argv[++i]);
2020-03-06 19:46:42 +01:00
else if (!strcmp(argv[i], "-i")) opts.nnoise = atoi(argv[++i]);
2020-03-06 11:54:28 +01:00
else {
fprintf(stderr, "Usage: %s -[hiIntp]\n", argv[0]);
fprintf(stderr, "\t-h\tShow this message.\n");
fprintf(stderr, "\t-m MODE\tThe disciminant to use: 'fisher' for "
"Fisher linear discriminant, 'percep' for perceptron.\n");
2020-03-06 19:46:42 +01:00
fprintf(stderr, "\t-i N\tThe number of training iterations (for perceptron).\n");
2020-03-06 11:54:28 +01:00
fprintf(stderr, "\t-n N\tThe number of events in noise class.\n");
return EXIT_FAILURE;
}
2020-03-06 02:24:32 +01:00
}
// initialize RNG
gsl_rng_env_setup();
gsl_rng *r = gsl_rng_alloc(gsl_rng_default);
/* Generate two classes of normally
* distributed 2D points with different
* paramters: signal and noise.
*/
struct par par_sig = { 0, 0, 0.3, 0.3, 0.5 };
struct par par_noise = { 4, 4, 1.0, 1.0, 0.4 };
2020-03-06 11:54:28 +01:00
sample_t *signal = generate_normal(r, opts.nsig, &par_sig);
sample_t *noise = generate_normal(r, opts.nnoise, &par_noise);
2020-03-06 02:24:32 +01:00
2020-03-06 19:46:42 +01:00
gsl_vector *w;
double t_cut;
2020-03-06 11:54:28 +01:00
if (!strcmp(opts.mode, "fisher")) {
/* Fisher linear discriminant
*
* First calculate the direction w onto
* which project the data points. Then the
* cut which determines the class for each
* projected point.
*/
fputs("# Linear Fisher discriminant\n\n", stderr);
2020-03-06 19:46:42 +01:00
double ratio = opts.nsig / (double)opts.nnoise;
w = fisher_proj(signal, noise);
t_cut = fisher_cut(ratio, w, signal, noise);
2020-03-06 11:54:28 +01:00
}
2020-03-06 19:46:42 +01:00
else if (!strcmp(opts.mode, "percep")) {
/* Perceptron
*
* Train a single perceptron on the
* dataset to get an approximate
* solution in `iter` iterations.
*/
fputs("# Perceptron \n\n", stderr);
w = percep_train(signal, noise, opts.iter, &t_cut);
}
else {
fputs("\n\nerror: invalid mode. select either"
" 'fisher' or 'percep'\n", stderr);
return EXIT_FAILURE;
}
/* Print the results of the method
* selected: weights and threshold.
*/
fprintf(stderr, "* w: [%.3f, %.3f]\n",
gsl_vector_get(w, 0),
gsl_vector_get(w, 1));
fprintf(stderr, "* t_cut: %.3f\n", t_cut);
gsl_vector_fprintf(stdout, w, "%g");
printf("%f\n", t_cut);
2020-03-06 02:24:32 +01:00
/* Print data to stdout for plotting.
2020-03-06 11:54:28 +01:00
* Note: we print the sizes to be able
2020-03-06 02:24:32 +01:00
* to set apart the two matrices.
*/
2020-03-06 11:54:28 +01:00
printf("%ld %ld %d\n", opts.nsig, opts.nnoise, 2);
2020-03-06 02:24:32 +01:00
gsl_matrix_fprintf(stdout, signal->data, "%g");
gsl_matrix_fprintf(stdout, noise->data, "%g");
// free memory
gsl_rng_free(r);
sample_t_free(signal);
sample_t_free(noise);
return EXIT_SUCCESS;
}