//------------------------------------------------------------------------------
// name: mosaic-synth-osc-kb.ck (v1.3)
// desc: basic structure for a feature-based synthesizer
//       this particular version uses microphone as live input,
//       send OSC message to whoever listening (e.g., visuals)
//       and responds to keyboard input (1-9, f, d, c)
//
// version: need chuck version 1.4.2.1 or higher
// sorting: part of ChAI (ChucK for AI)
//
// USAGE: run with INPUT model file
//        > chuck mosaic-synth-osc-kb:file
//
// uncomment the next line to learn more about the KNN2 object:
// KNN2.help();
//
// date: Spring 2023
// authors: Ge Wang (https://ccrma.stanford.edu/~ge/)
//          Yikai Li
//------------------------------------------------------------------------------


// which keyboard to open (chuck --probe to available)
0 => int KB_DEVICE;

// input: pre-extracted model file
me.dir() + "features.txt" => string FEATURES_FILE;
// if have arguments, override filename
if( me.args() > 0 )
{
    me.arg(0) => FEATURES_FILE;
}
//------------------------------------------------------------------------------
// expected model file format; each VALUE is a feature value
// (feel free to adapt and modify the file format as needed)
//------------------------------------------------------------------------------
// filePath windowStartTime VALUE VALUE ... VALUE
// filePath windowStartTime VALUE VALUE ... VALUE
// ...
// filePath windowStartTime VALUE VALUE ... VALUE
//------------------------------------------------------------------------------


//------------------------------------------------------------------------------
// unit analyzer network: *** this must match the features in the features file
//------------------------------------------------------------------------------
// audio input into a FFT
adc => FFT fft;
// a thing for collecting multiple features into one vector
FeatureCollector combo => blackhole;
// add spectral feature: Centroid
fft =^ Centroid centroid =^ combo;
// add spectral feature: Flux
fft =^ Flux flux =^ combo;
// add spectral feature: RMS
fft =^ RMS rms =^ combo;
// add spectral feature: MFCC
fft =^ MFCC mfcc =^ combo;


//-----------------------------------------------------------------------------
// setting analysis parameters -- also should match what was used during extration
//-----------------------------------------------------------------------------
// set number of coefficients in MFCC (how many we get out)
// 13 is a commonly used value; using less here for printing
20 => mfcc.numCoeffs;
// set number of mel filters in MFCC
10 => mfcc.numFilters;

// do one .upchuck() so FeatureCollector knows how many total dimension
combo.upchuck();
// get number of total feature dimensions
combo.fvals().size() => int NUM_DIMENSIONS;

// set FFT size
4096*8 => fft.size;
// set window type and size
Windowing.hann(fft.size()) => fft.window;
// our hop size (how often to perform analysis)
(fft.size()/2)::samp => dur HOP;
// how many frames to aggregate before averaging?
// (this does not need to match extraction; might play with this number)
4 => int NUM_FRAMES;
// how much time to aggregate features for each file
fft.size()::samp * NUM_FRAMES => dur EXTRACT_TIME;


//------------------------------------------------------------------------------
// unit generator network: for real-time sound synthesis
//------------------------------------------------------------------------------
// how many max at any time?
8 => int NUM_VOICES;
// a number of audio buffers to cycel between
SndBuf buffers[NUM_VOICES]; ADSR envs[NUM_VOICES]; Pan2 pans[NUM_VOICES];
// set parameters
for( int i; i < NUM_VOICES; i++ )
{
    // connect audio
    buffers[i] => envs[i] => pans[i] => dac;
    // set chunk size (how to to load at a time)
    // this is important when reading from large files
    // if this is not set, SndBuf.read() will load the entire file immediately
    fft.size() => buffers[i].chunks;
    // randomize pan
    Math.random2f(-.75,.75) => pans[i].pan;
    // set envelope parameters
    envs[i].set( EXTRACT_TIME, EXTRACT_TIME/2, 1, EXTRACT_TIME );
}
1 => NUM_VOICES;


//------------------------------------------------------------------------------
// load feature data; read important global values like numPoints and numCoeffs
//------------------------------------------------------------------------------
// values to be read from file
0 => int numPoints; // number of points in data
0 => int numCoeffs; // number of dimensions in data
// file read PART 1: read over the file to get numPoints and numCoeffs
loadFile( FEATURES_FILE ) @=> FileIO @ fin;
// check
if( !fin.good() ) me.exit();
// check dimension at least
if( numCoeffs != NUM_DIMENSIONS )
{
    // error
    <<< "[error] expecting:", NUM_DIMENSIONS, "dimensions; but features file has:", numCoeffs >>>;
    // stop
    me.exit();
}


//------------------------------------------------------------------------------
// each Point corresponds to one line in the input file, which is one audio window
//------------------------------------------------------------------------------
class AudioWindow
{
    // unique point index (use this to lookup feature vector)
    int uid;
    // which file did this come file (in files arary)
    int fileIndex;
    // starting time in that file (in seconds)
    float windowTime;
    
    // set
    fun void set( int id, int fi, float wt )
    {
        id => uid;
        fi => fileIndex;
        wt => windowTime;
    }
}

// array of all points in model file
AudioWindow windows[numPoints];
// unique filenames; we will append to this
string files[0];
// map of filenames loaded
int filename2state[0];
// feature vectors of data points
float inFeatures[numPoints][numCoeffs];
// generate array of unique indices
int uids[numPoints]; for( int i; i < numPoints; i++ ) i => uids[i];

// use this for new input
//float features[NUM_FRAMES][numCoeffs];
// average values of coefficients across frames
//float featureMean[numCoeffs];


//------------------------------------------------------------------------------
// read the data
//------------------------------------------------------------------------------
readData( fin );


float reducedFeatures[numPoints][2];
PCA.reduce(inFeatures, 2, reducedFeatures);
[ 0., 0. ] @=> float dimMin[];
[ 0., 0. ] @=> float dimMax[];
// initialize
for( int i; i < dimMin.size(); i++ ) Math.FLOAT_MAX/2 => dimMin[i];
for( int i; i < dimMax.size(); i++ ) -Math.FLOAT_MAX/2 => dimMax[i];
for( int i; i < numPoints; i++)
{
    for( int j; j < 2; j++)
    {
        if(reducedFeatures[i][j] < dimMin[j]) reducedFeatures[i][j] => dimMin[j];
        if(reducedFeatures[i][j] > dimMax[j]) reducedFeatures[i][j] => dimMax[j];
    }
}
[(dimMin[0] + dimMax[0]) / 2., (dimMin[1] + dimMax[1]) / 2.] @=> float Zcur[];
//[(dimMin[0] + dimMax[0]) / 2., (dimMin[1] + dimMax[1]) / 2.] @=> float Zprev[];


79 => int KEY_RIGHT;
80 => int KEY_LEFT;
81 => int KEY_DOWN;
82 => int KEY_UP;
45 => int KEY_MINUS;
46 => int KEY_EQUAL;

//------------------------------------------------------------------------------
// set up our KNN object to use for classification
// (KNN2 is a fancier version of the KNN object)
// -- run KNN2.help(); in a separate program to see its available functions --
//------------------------------------------------------------------------------
KNN2 knn;
// k nearest neighbors
4 => int K;
// results vector (indices of k nearest points)
int knnResult[K];
// knn train
//knn.train( inFeatures, uids );
knn.train( reducedFeatures, uids );

// used to rotate sound buffers
0 => int which;

// key modes
1 => int PLAYBACK;
false => int MODE_CONCAT;

false => int MODE_LET_PLAY;
false => int MODE_FAVOR_CLOSEST_WINDOW;
AudioWindow @ CURR_WIN;


//------------------------------------------------------------------------------
// SYNTHESIS!!
// this function is meant to be sporked so it can be stacked in time
//------------------------------------------------------------------------------
fun void synthesize( int uid )
{
    // get the buffer to use
    buffers[which] @=> SndBuf @ sound;
    // get the envelope to use
    envs[which] @=> ADSR @ envelope;
    // increment and wrap if needed
    if (MODE_CONCAT) { which++; }
    if( which >= NUM_VOICES ) 0 => which;
    
    // get a referencde to the audio fragment to synthesize
    windows[uid] @=> AudioWindow @ win @=> CURR_WIN;
    // get filename
    files[win.fileIndex] => string filename;
    // load into sound buffer
    me.dir() + filename => sound.read;
    // playback rate 
    if (MODE_CONCAT) 
    { 
        Math.randomf() => float prob;
        if (prob >= (NUM_VOICES - 1.) / 10.) { 1. => sound.rate; }
        else { -1 => sound.rate; }
    }
    else { PLAYBACK => sound.rate; }
    // seek to the window start time
    ((win.windowTime::second)/samp) $ int => sound.pos;
    
    // print what we are about to play
    chout <= "synthesizing window (k=" <= K <= "|closest=" <= MODE_FAVOR_CLOSEST_WINDOW <= "): ";
    // print label
    chout <= win.uid <= "["
    <= win.fileIndex <= ":"
    <= win.windowTime <= ":position="
    <= sound.pos() <= "]";
    // endline
    chout <= IO.newline();
    
    // send window info to visualizer!
    if( !MODE_LET_PLAY) sendWindow( win.fileIndex, win.windowTime );
    
    // open the envelope, overlap add this into the overall audio
    envelope.keyOn();
    // wait
    (EXTRACT_TIME*3)-envelope.releaseTime() => now;
    // start the release
    envelope.keyOff();
    // wait
    envelope.releaseTime() => now;
}


// destination host name
"localhost" => string hostname;
// destination port number
12000 => int port;

// sender object
OscOut xmit;

// aim the transmitter at destination
xmit.dest( hostname, port );

// send OSC message: current file index and startTime, uniquely identifying a window
fun void sendWindow( int fileIndex, float startTime )
{
    // start the message...
    xmit.start( "/mosaic/window" );
    
    // add int argument
    fileIndex=> xmit.add;
    // add float argument
    startTime => xmit.add;
    // send it
    xmit.send();
}


Hid hid;
HidMsg msg;

// open keyboard (get device number from command line)
if( !hid.openKeyboard( KB_DEVICE ) ) me.exit();
<<< "keyboard '" + hid.name() + "' ready", "" >>>;

spork ~ kb();

fun void kb()
{
    // infinite event loop
    while( true )
    {
        // wait on event
        hid => now;
        
        // get one or more messages
        while( hid.recv( msg ) )
        {
            // check for action type
            if( msg.isButtonDown() ) // button down
            {
                <<< "down:", msg.which, "(code)", msg.key, "(usb key)", msg.ascii, "(ascii)" >>>;
                if( msg.ascii >= 49 && msg.ascii <= 58 ) // 1-8
                {
                    msg.ascii - 48 => NUM_VOICES;
                }
                else if ( msg.which == KEY_MINUS )
                {
                    -PLAYBACK => PLAYBACK;
                }
                
                else if ( msg.which == KEY_EQUAL ) // CHANGE MODE
                { 
                    -MODE_CONCAT + 1 => MODE_CONCAT; 
                    if (MODE_CONCAT)
                    {
                        reducedFeatures[knnResult[0]][0] => Zcur[0];
                        reducedFeatures[knnResult[0]][1] => Zcur[1];
                    }
                }

                else if ( msg.which == KEY_LEFT )
                {
                    Zcur[0] - 1. => Zcur[0];
                    if (Zcur[0] < dimMin[0]) dimMin[0] => Zcur[0];
                    <<< "LEFT:", Zcur[0], Zcur[1] >>>;
                }
                else if( msg.which == KEY_RIGHT )
                {
                    Zcur[0] + 1. => Zcur[0];
                    if (Zcur[0] > dimMax[0]) dimMax[0] => Zcur[0];
                    <<< "RIGHT:", Zcur[0], Zcur[1] >>>;
                }
                else if( msg.which == KEY_DOWN )
                {
                    Zcur[1] - 1. => Zcur[1];
                    if (Zcur[1] < dimMin[1]) dimMin[1] => Zcur[1];
                    <<< "DOWN:", Zcur[0], Zcur[1] >>>;
                }
                else if( msg.which == KEY_UP )
                {
                    Zcur[1] + 1. => Zcur[1];
                    if (Zcur[1] > dimMax[1]) dimMax[1] => Zcur[1];
                    <<< "UP:", Zcur[0], Zcur[1] >>>;
                }
            }
            else // button up
            {

            }
        }
    }
}

//------------------------------------------------------------------------------
// real-time similarity retrieval loop
//------------------------------------------------------------------------------
while( true )
{
    if (MODE_CONCAT)
    {
        for( int frame; frame < NUM_FRAMES; frame++ )
        {
            HOP => now;
        }
        knn.search( Zcur, K, knnResult );
        
        // which window 
        Math.random2(0,knnResult.size()-1) => int win;
        Math.INT_MAX => int diff;
        // find closest window
        if( MODE_FAVOR_CLOSEST_WINDOW && CURR_WIN != null )
        {
            for( int w; w < knnResult.size(); w++ )
            {
                if( Math.abs(windows[knnResult[w]].uid-CURR_WIN.uid) < diff )
                {
                    w => win;
                }
            }
        }
        // SYNTHESIZE THIS
        spork ~ synthesize( knnResult[win] );
    }
    else 
    {                
        spork ~ synthesize( knnResult[0] );
        (windows[1].windowTime - 0.171)::second => now;
        
        (knnResult[0] + PLAYBACK) => knnResult[0];
        if (knnResult[0] >= numPoints) 
        { 
            while (true) { 100::ms => now; } 
        }
        
        if (knnResult[0] < 0) { numPoints - 1 => knnResult[0]; }
    }
}
//------------------------------------------------------------------------------
// end of real-time similiarity retrieval loop
//------------------------------------------------------------------------------
        

//------------------------------------------------------------------------------
// function: load data file
//------------------------------------------------------------------------------
fun FileIO loadFile( string filepath )
{
    // reset
    0 => numPoints;
    0 => numCoeffs;
    
    // load data
    FileIO fio;
    if( !fio.open( filepath, FileIO.READ ) )
    {
        // error
        <<< "cannot open file:", filepath >>>;
        // close
        fio.close();
        // return
        return fio;
    }
    
    string str;
    string line;
    // read the first non-empty line
    while( fio.more() )
    {
        // read each line
        fio.readLine().trim() => str;
        // check if empty line
        if( str != "" )
        {
            numPoints++;
            str => line;
        }
    }
    
    // a string tokenizer
    StringTokenizer tokenizer;
    // set to last non-empty line
    tokenizer.set( line );
    // negative (to account for filePath windowTime)
    -2 => numCoeffs;
    // see how many, including label name
    while( tokenizer.more() )
    {
        tokenizer.next();
        numCoeffs++;
    }
    
    // see if we made it past the initial fields
    if( numCoeffs < 0 ) 0 => numCoeffs;
    
    // check
    if( numPoints == 0 || numCoeffs <= 0 )
    {
        <<< "no data in file:", filepath >>>;
        fio.close();
        return fio;
    }
    
    // print
    <<< "# of data points:", numPoints, "dimensions:", numCoeffs >>>;
    
    // done for now
    return fio;
}


//------------------------------------------------------------------------------
// function: read the data
//------------------------------------------------------------------------------
fun void readData( FileIO fio )
{
    // rewind the file reader
    fio.seek( 0 );
    
    // a line
    string line;
    // a string tokenizer
    StringTokenizer tokenizer;
    
    // points index
    0 => int index;
    // file index
    0 => int fileIndex;
    // file name
    string filename;
    // window start time
    float windowTime;
    // coefficient
    int c;
    
    // read the first non-empty line
    while( fio.more() )
    {
        // read each line
        fio.readLine().trim() => line;
        // check if empty line
        if( line != "" )
        {
            // set to last non-empty line
            tokenizer.set( line );
            // file name
            tokenizer.next() => filename;
            // window start time
            tokenizer.next() => Std.atof => windowTime;
            // have we seen this filename yet?
            if( filename2state[filename] == 0 )
            {
                // make a new string (<< appends by reference)
                filename => string sss;
                // append
                files << sss;
                // new id
                files.size() => filename2state[filename];
            }
            // get fileindex
            filename2state[filename]-1 => fileIndex;
            // set
            windows[index].set( index, fileIndex, windowTime );
            
            // zero out
            0 => c;
            // for each dimension in the data
            repeat( numCoeffs )
            {
                // read next coefficient
                tokenizer.next() => Std.atof => inFeatures[index][c];
                // increment
                c++;
            }
            
            // increment global index
            index++;
        }
    }
}