mirror of
https://github.com/BlackLight/Voxifera.git
synced 2024-11-27 21:55:12 +01:00
193 lines
4.3 KiB
C
193 lines
4.3 KiB
C
#include "vocal.h"
|
|
|
|
typedef enum { capture, append } mode;
|
|
|
|
void helpandusage() {
|
|
fprintf (stderr,
|
|
"---=== BlackLight's vocal recognition v.0.1b ===---\n"
|
|
"author @ blacklight@autistici.org\n\n"
|
|
"Usage: vocal [-d <device>] [-a] [-c <file>] [-h]\n\n"
|
|
"\t-d <device>\tUse a different device instead the default one (/dev/dsp)\n"
|
|
"\t-a\t\tAppend a new vocal sample with an associated command\n"
|
|
"\t-c <file>\tUse a different rc file (default: ~/.vocalrc)\n"
|
|
"\t-h\t\tPrint this help and exit\n"
|
|
);
|
|
}
|
|
|
|
int main (int argc, char **argv) {
|
|
int i, j, dsp, fd, ch, size, recognized;
|
|
int TOTSIZE = BUF_SIZE*SAMPLE_SIZE;
|
|
|
|
char *line, *tmp, *cmd = NULL, *fname = NULL, device = NULL;
|
|
char **match = NULL;
|
|
|
|
double deviance;
|
|
double *neutral, *trans;
|
|
double value, sum = 0.0;
|
|
double PIconst = (D_M_PI/TOTSIZE);
|
|
double coeff = 1.0 / TOTSIZE;
|
|
double t, v;
|
|
|
|
FILE *fp;
|
|
time_t t1, t2;
|
|
|
|
u8 *buf;
|
|
mode m = capture;
|
|
|
|
while ((ch=getopt(argc, argv, "ahc:d:"))>0) {
|
|
switch(ch){
|
|
case 'd' : device = strdup(optarg); break;
|
|
case 'a' : m = append; break;
|
|
case 'c' : fname = strdup(optarg); break;
|
|
case 'h' : helpandusage();
|
|
return 0; break;
|
|
default :
|
|
helpandusage();
|
|
return 1;
|
|
}
|
|
}
|
|
|
|
buf = (u8*) malloc(TOTSIZE);
|
|
neutral = (double*) malloc(TOTSIZE*sizeof(double));
|
|
trans = (double*) malloc(TOTSIZE*sizeof(double));
|
|
memset(buf, 0x80, TOTSIZE);
|
|
|
|
if (!fname) {
|
|
fname = (char*) malloc(0x100);
|
|
snprintf (fname, 0x100, "%s/.vocalrc", getenv("HOME"));
|
|
}
|
|
|
|
if ((fd=open("neutral.ft", O_RDONLY, 0644))<0) {
|
|
perror ("could not find file neutral.ft");
|
|
return 1;
|
|
}
|
|
|
|
read (fd, neutral, TOTSIZE*sizeof(double));
|
|
close(fd);
|
|
|
|
if ((dsp = init_dsp( device ))<0)
|
|
return 1;
|
|
|
|
memset (buf, 0x0, TOTSIZE);
|
|
printf ("now capturing, say something...\n");
|
|
|
|
if (read(dsp, buf, TOTSIZE) != TOTSIZE) {
|
|
perror("read the wrong number of bytes");
|
|
return 1;
|
|
}
|
|
|
|
close(dsp);
|
|
|
|
printf ("capture done, computing DCT...\n");
|
|
int count = 0;
|
|
t1 = time((unsigned) NULL);
|
|
|
|
for (i=0; i<TOTSIZE; ++i) {
|
|
t = PIconst*i;
|
|
v = 0.0;
|
|
|
|
for (j=0; j<TOTSIZE; ++j) {
|
|
if (t && j)
|
|
v += buf[j] * cos(t*j);
|
|
else
|
|
v += buf[j];
|
|
|
|
if (t*j < D_M_PI)
|
|
count++;
|
|
}
|
|
|
|
v *= coeff;
|
|
v -= neutral[i];
|
|
v = (v >= 0) ? v : -v;
|
|
trans[i] = log(v);
|
|
}
|
|
|
|
free(neutral);
|
|
free(buf);
|
|
|
|
t2 = time((unsigned) NULL);
|
|
printf ("DCT computing: done in %u seconds\n", (unsigned int) (t2-t1));
|
|
printf ("%d arg < 2*pi\n", count);
|
|
|
|
for (i=0; i<TOTSIZE; i++)
|
|
sum += trans[i];
|
|
sum = exp(sum/100000.0);
|
|
free(trans);
|
|
|
|
printf ("vocal sequence successfully acquired, Fourier sum = %g\n", sum);
|
|
|
|
if (m == append) {
|
|
printf ("which command would you like to associate for this vocal sequence? ");
|
|
cmd = getline(stdin);
|
|
|
|
if (!(fp=fopen(fname,"a"))) {
|
|
perror ("Unable to open configuration file");
|
|
return 1;
|
|
}
|
|
|
|
fprintf (fp, "%s: %g\n", cmd, sum);
|
|
fclose(fp);
|
|
free(cmd);
|
|
printf ("sequence successfully saved\n");
|
|
} else {
|
|
if (!(fp=fopen(fname,"r"))) {
|
|
perror ("Unable to open configuration file");
|
|
return 1;
|
|
}
|
|
|
|
recognized=0;
|
|
|
|
for (i=1; (line=getline(fp)) && !feof(fp); i++) {
|
|
if ((match=preg_match("^.+:\\s", line, &size))) {
|
|
tmp = strdup(match[0]);
|
|
tmp[strlen(match[0])-2] = 0;
|
|
|
|
if ((match=preg_match(":\\s.+$", line, &size))) {
|
|
for (j=2; j<strlen(match[0]); j++)
|
|
match[0][j-2] = match[0][j];
|
|
|
|
match[j-2]=0;
|
|
value = atof(match[0]);
|
|
|
|
if (ABS(ABS(value)-ABS(sum)) <= 0.025) {
|
|
if (!recognized) {
|
|
deviance = ABS(ABS(value)-ABS(sum));
|
|
cmd = strdup(tmp);
|
|
recognized=1;
|
|
} else {
|
|
if (ABS(ABS(value)-ABS(sum)) < deviance) {
|
|
deviance = ABS(ABS(value)-ABS(sum));
|
|
cmd = strdup(tmp);
|
|
}
|
|
}
|
|
}
|
|
} else {
|
|
fprintf (stderr, "Parse error at %s:%d\n", fname, i);
|
|
return 1;
|
|
}
|
|
|
|
free(tmp);
|
|
} else {
|
|
fprintf (stderr, "Parse error at %s:%d\n", fname, i);
|
|
return 1;
|
|
}
|
|
}
|
|
|
|
if (recognized) {
|
|
printf ("value = %g, deviance = %g: vocal command recognized: %s\n",
|
|
value, deviance, cmd);
|
|
|
|
cmd = (char*) realloc(cmd, strlen(cmd)+3);
|
|
sprintf (cmd, "%s &", cmd);
|
|
system (cmd);
|
|
free(cmd);
|
|
} else
|
|
printf ("I'm sorry, I'm not smart enough to understand what you said :(\n");
|
|
}
|
|
|
|
if (fname)
|
|
free(fname);
|
|
|
|
return 0;
|
|
}
|
|
|