/* Serval Voice Over Mesh Protocol (VoMP) Copyright (C) 2012 Paul Gardner-Stephen Copyright (C) 2012 Serval Project Inc. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. */ /* VoMP works using a 6-state model of a phone call, and relies on MDP for auth-cryption of frames. VoMP provides it's own replay protection. */ #include "serval.h" #include "str.h" #include "strbuf.h" #include "strlcpy.h" /* Typical call state lifecycle between 2 parties. Legend; # incoming command from monitor client $ outgoing monitor status <> vomp packet with state change sent across the network Monitor Init # MONITOR VOMP [supported codec list] Dialing // client requests an outgoing call # CALL [sid] [myDid] [TheirDid] > CALLPREP + codecs + phone numbers // let the client know what token we are going to use for the remainder of the call $ CALLTO [token] [mySid] [myDid] [TheirSid] [TheirDid] // allocate a session number and tell them our codecs, // but we don't need to do anything else yet, // this might be a replay attack < NOCALL + codecs // Ok, we have a network path, lets try to establish the call $ CODECS [token] [their supported codec list] > RINGOUT $ CODECS [token] [their supported codec list] // (Note that if both parties are trying to dial each other, // the call should jump straight to INCALL) // inform client about the call request $ CALLFROM [token] [mySid] [myDid] [TheirSid] [TheirDid] // Note that we may need to wait for other external processes // before a phone is actually ringing # RING [token] < RINGIN // All good, there's a phone out there ringing, you can indicate that to the user $ RINGING [token] Answering # PICKUP [token] < INCALL // The client can now start sending audio > INCALL $ INCALL [token] // The client can now start sending audio $ INCALL [token] Tell any clients that the call hasn't timed out yet (if servald is behaving this should be redundant, if it isn't behaving how do we hangup?) $ KEEPALIVE [token] Hanging up (may also be triggered on network or call establishment timeout) # HANGUP [token] > CALLENDED $ HANGUP [token] < CALLENDED $ HANGUP [token] */ /* Minimum network format requirements; - your call session, packed integer - my call state - my sequence number Pre-ring call setup; - my call session - my supported codec list - your number - my number - my name In call audio; - codec - elapsed time from call start - audio duration - audio data (remainder of payload) Assuming minimum audio duration per packet is 20ms, 1 byte sequence should let us deal with ~2.5s of jitter. If we have >2.5s of jitter, the network is obviously too crappy to support a voice call anyway. If we can assume constant duration per codec, and I believe we can, we can use the sequence number to derive the other audio timing information. We need to resume a call even with large periods of zero traffic (eg >10s), we should be able to use our own wall clock to estimate which 5s interval the audio belongs to. */ // ideally these id's should only be used on the network, with monitor events to inform clients of state changes #define VOMP_STATE_NOCALL 1 #define VOMP_STATE_CALLPREP 2 #define VOMP_STATE_RINGINGOUT 3 #define VOMP_STATE_RINGINGIN 4 #define VOMP_STATE_INCALL 5 #define VOMP_STATE_CALLENDED 6 #define VOMP_SESSION_MASK 0xffffff #define VOMP_MAX_CALLS 16 struct vomp_call_half { unsigned char sid[SID_SIZE]; char did[64]; unsigned char state; unsigned char codec; unsigned int session; unsigned int sequence; }; struct jitter_sample{ int sample_clock; int local_clock; int delta; int sort_index; }; #define JITTER_SAMPLES 128 struct jitter_measurements{ struct jitter_sample samples[JITTER_SAMPLES]; struct jitter_sample *sorted_samples[JITTER_SAMPLES]; int next_sample; int max_sample_clock; int sample_count; }; struct vomp_call_state { struct sched_ent alarm; struct vomp_call_half local; struct vomp_call_half remote; int initiated_call; time_ms_t create_time; time_ms_t last_activity; time_ms_t audio_clock; // last local & remote status we sent to all interested parties int last_sent_status; unsigned char remote_codec_flags[CODEC_FLAGS_LENGTH]; struct jitter_measurements jitter; // track when we first heard audio, so we can calculate timing from the current sequence number int first_remote_audio_sequence; // simple ring buffer of audio sample times, used to drop duplicate incoming frames // stores end times, since this is an odd number we can initialise the buffer to zero's int sample_pos; unsigned int seen_samples[VOMP_MAX_RECENT_SAMPLES *4]; }; /* Some clients may only support one call at a time, even then we allow for multiple call states. This is partly to deal with denial of service attacks that might occur by causing the ejection of newly allocated session numbers before the caller has had a chance to progress the call to a further state. */ int vomp_call_count=0; struct vomp_call_state vomp_call_states[VOMP_MAX_CALLS]; struct profile_total vomp_stats; static void vomp_process_tick(struct sched_ent *alarm); static const char *vomp_describe_codec(int c); strbuf strbuf_append_vomp_supported_codecs(strbuf sb, const unsigned char supported_codecs[256]); void store_jitter_sample(struct jitter_measurements *measurements, int sample_clock, int local_clock){ IN(); int i; struct jitter_sample *sample = &measurements->samples[measurements->next_sample]; measurements->next_sample++; if (measurements->next_sample>=JITTER_SAMPLES) measurements->next_sample=0; int delta=(local_clock - sample_clock); int pos=0; if (measurements->sample_count>0){ int old_index = measurements->sample_count; if (measurements->sample_count>=JITTER_SAMPLES){ old_index = sample->sort_index; } // binary search to find insert position int min=0; int max=measurements->sample_count -1; while(min<=max){ pos = (max+min) / 2; if (delta <= measurements->sorted_samples[pos]->delta){ max = pos-1; }else{ pos++; min = pos; } } if (pos>=measurements->sample_count) pos=measurements->sample_count -1; // shuffle the sorted array elements for (i=old_index;i>pos;i--){ measurements->sorted_samples[i]=measurements->sorted_samples[i-1]; measurements->sorted_samples[i]->sort_index=i; } for (i=old_index;isorted_samples[i]=measurements->sorted_samples[i+1]; measurements->sorted_samples[i]->sort_index=i; } } measurements->sorted_samples[pos]=sample; if (measurements->sample_countsample_count++; sample->sample_clock = sample_clock; sample->local_clock = local_clock; sample->delta = delta; sample->sort_index = pos; if (sample_clock > measurements->max_sample_clock) measurements->max_sample_clock=sample_clock; OUT(); } int get_jitter_size(struct jitter_measurements *measurements){ IN(); int i=JITTER_SAMPLES -4; int jitter; if (i>=measurements->sample_count) i=measurements->sample_count -1; jitter=measurements->sorted_samples[i]->delta - measurements->sorted_samples[0]->delta; RETURN(jitter); } void set_codec_flag(int codec, unsigned char *flags){ if (codec<0 || codec>255) return; flags[codec >> 3] |= 1<<(codec & 7); } int is_codec_set(int codec, unsigned char *flags){ if (codec<0 || codec>255) return 0; return flags[codec >> 3] & (1<<(codec & 7)); } struct vomp_call_state *vomp_find_call_by_session(int session_token) { int i; for(i=0;ilocal.sid,SID_SIZE); bcopy(remote_sid,call->remote.sid,SID_SIZE); call->local.session=local_session; call->remote.session=remote_session; call->local.state=VOMP_STATE_NOCALL; call->remote.state=VOMP_STATE_NOCALL; call->last_sent_status=-1; call->create_time=gettime_ms(); call->last_activity=call->create_time; call->alarm.alarm = call->create_time+VOMP_CALL_STATUS_INTERVAL; call->alarm.function = vomp_process_tick; vomp_stats.name="vomp_process_tick"; call->alarm.stats=&vomp_stats; schedule(&call->alarm); if (debug & DEBUG_VOMP) DEBUGF("Returning new call #%d",local_session); return call; } struct vomp_call_state *vomp_find_or_create_call(unsigned char *remote_sid, unsigned char *local_sid, unsigned int sender_session, unsigned int recvr_session, int sender_state, int recvr_state) { int i; struct vomp_call_state *call; if (debug & DEBUG_VOMP) DEBUGF("%d calls already in progress.",vomp_call_count); for(i=0;iremote.session, call->local.session); int checked=0; if (call->remote.session&&sender_session) { checked++; if(sender_session!=call->remote.session) continue; } if (call->local.session&&recvr_session) { checked++; if(recvr_session!=call->local.session) continue; } if (!checked) continue; if (memcmp(remote_sid,call->remote.sid,SID_SIZE)) continue; if (memcmp(local_sid,call->local.sid,SID_SIZE)) continue; /* it matches. */ /* Record session number if required */ if (!call->remote.session) call->remote.session=sender_session; if (debug & DEBUG_VOMP) { DEBUGF("%06x:%06x matches call #%d %06x:%06x", sender_session,recvr_session,i, call->remote.session, call->local.session); } return call; } /* Don't create a call record if either party has ended it */ if (sender_state==VOMP_STATE_CALLENDED || recvr_state==VOMP_STATE_CALLENDED) return NULL; /* Only create a call record if either party is in CALLPREP state */ if (sender_state==VOMP_STATE_CALLPREP || recvr_state==VOMP_STATE_CALLPREP) return vomp_create_call(remote_sid, local_sid, sender_session, recvr_session); return NULL; } static void prepare_vomp_header(struct vomp_call_state *call, overlay_mdp_frame *mdp){ mdp->packetTypeAndFlags=MDP_TX; bcopy(call->local.sid,mdp->out.src.sid,SID_SIZE); mdp->out.src.port=MDP_PORT_VOMP; bcopy(call->remote.sid,mdp->out.dst.sid,SID_SIZE); mdp->out.dst.port=MDP_PORT_VOMP; mdp->out.payload[0]=0x01; /* Normal VoMP frame */ mdp->out.payload[1]=(call->remote.state<<4)|call->local.state; mdp->out.payload[2]=(call->remote.sequence>>8)&0xff; mdp->out.payload[3]=(call->remote.sequence>>0)&0xff; mdp->out.payload[4]=(call->local.sequence>>8)&0xff; mdp->out.payload[5]=(call->local.sequence>>0)&0xff; time_ms_t call_millis = gettime_ms() - call->create_time; mdp->out.payload[6]=(call_millis>>8)&0xff; mdp->out.payload[7]=(call_millis>>0)&0xff; mdp->out.payload[8]=(call->remote.session>>16)&0xff; mdp->out.payload[9]=(call->remote.session>>8)&0xff; mdp->out.payload[10]=(call->remote.session>>0)&0xff; mdp->out.payload[11]=(call->local.session>>16)&0xff; mdp->out.payload[12]=(call->local.session>>8)&0xff; mdp->out.payload[13]=(call->local.session>>0)&0xff; mdp->out.payload_length=14; } /* send updated call status to end-point and to any interested listeners as appropriate */ int vomp_send_status_remote(struct vomp_call_state *call) { overlay_mdp_frame mdp; unsigned short *len=&mdp.out.payload_length; bzero(&mdp,sizeof(mdp)); prepare_vomp_header(call, &mdp); if (call->local.state < VOMP_STATE_RINGINGOUT && call->remote.state < VOMP_STATE_RINGINGOUT) { int didLen; unsigned char codecs[CODEC_FLAGS_LENGTH]; /* Include the list of supported codecs */ monitor_get_all_supported_codecs(codecs); int i; for (i = 0; i < 256; ++i) if (is_codec_set(i,codecs)) { mdp.out.payload[(*len)++]=i; if (debug & DEBUG_VOMP) DEBUGF("I support the %s codec", vomp_describe_codec(i)); } mdp.out.payload[(*len)++]=0; /* Include src and dst phone numbers */ if (call->initiated_call){ DEBUGF("Sending phone numbers %s, %s",call->local.did,call->remote.did); didLen = snprintf((char *)(mdp.out.payload + *len), sizeof(mdp.out.payload) - *len, "%s", call->local.did); *len+=didLen+1; didLen = snprintf((char *)(mdp.out.payload + *len), sizeof(mdp.out.payload) - *len, "%s", call->remote.did); *len+=didLen+1; } if (debug & DEBUG_VOMP) DEBUGF("mdp frame with codec list is %d bytes", mdp.out.payload_length); } call->local.sequence++; overlay_mdp_dispatch(&mdp,0,NULL,0); return 0; } // copy audio into the rotor buffers int vomp_received_audio(struct vomp_call_state *call, int audio_codec, const unsigned char *audio, int audio_length) { if (call->local.state!=VOMP_STATE_INCALL) return -1; int codec_block_size=vomp_sample_size(audio_codec); int offset=0; int codec_duration = vomp_codec_timespan(audio_codec); while(offsetaudio_clock>>24)&0xff; mdp.out.payload[(*len)++]=(call->audio_clock>>16)&0xff; mdp.out.payload[(*len)++]=(call->audio_clock>>8)&0xff; mdp.out.payload[(*len)++]=(call->audio_clock>>0)&0xff; mdp.out.payload[(*len)++]=audio_codec; if (offset+codec_block_size>audio_length) codec_block_size = audio_length - offset; bcopy(audio+offset,&mdp.out.payload[(*len)],codec_block_size); (*len)+=codec_block_size; offset+=codec_block_size; call->audio_clock += codec_duration; call->local.sequence++; // send the payload more than once to add resilience to dropped packets // TODO remove once network links have built in retries mdp.out.send_copies=VOMP_MAX_RECENT_SAMPLES; overlay_mdp_dispatch(&mdp,0,NULL,0); } return 0; } int monitor_call_status(struct vomp_call_state *call) { char msg[1024]; int n = snprintf(msg,1024,"\nCALLSTATUS:%06x:%06x:%d:%d:%d:%s:%s:%s:%s\n", call->local.session,call->remote.session, call->local.state,call->remote.state, 0, alloca_tohex_sid(call->local.sid), alloca_tohex_sid(call->remote.sid), call->local.did,call->remote.did); monitor_tell_clients(msg, n, MONITOR_VOMP); return 0; } int monitor_send_audio(struct vomp_call_state *call, int audio_codec, unsigned int start_time, unsigned int end_time, const unsigned char *audio, int audio_length, int sequence) { if (0) DEBUGF("Tell call monitor about audio for call %06x:%06x", call->local.session,call->remote.session); int sample_bytes=vomp_sample_size(audio_codec); char msg[1024 + MAX_AUDIO_BYTES]; /* All commands followed by binary data start with *len:, so that they can be easily parsed at the far end, even if not supported. Put newline at start of these so that receiving data in command mode doesn't confuse the parser. */ int jitter_delay = get_jitter_size(&call->jitter); int msglen = snprintf(msg, 1024, "\n*%d:AUDIOPACKET:%x:%d:%d:%d:%d:%d\n", sample_bytes, call->local.session, audio_codec, start_time, end_time, sequence, jitter_delay); bcopy(audio, &msg[msglen], sample_bytes); msglen+=sample_bytes; msg[msglen++]='\n'; monitor_tell_clients(msg, msglen, MONITOR_VOMP); return 0; } // update local state and notify interested clients with the correct message int vomp_update_local_state(struct vomp_call_state *call, int new_state){ if (call->local.state>=new_state) return 0; if (new_state > VOMP_STATE_CALLPREP && new_state <= VOMP_STATE_INCALL && call->local.state<=VOMP_STATE_CALLPREP){ // tell clients about the remote codec list int i; unsigned char our_codecs[CODEC_FLAGS_LENGTH]; char msg[256]; monitor_get_all_supported_codecs(our_codecs); strbuf b = strbuf_local(msg, sizeof msg); strbuf_sprintf(b, "\nCODECS:%06x", call->local.session); for (i = 0; i < 256; ++i){ if (is_codec_set(i,call->remote_codec_flags) && is_codec_set(i,our_codecs)) { strbuf_sprintf(b, ":%d", i); } } strbuf_putc(b, '\n'); monitor_tell_clients(strbuf_str(b), strbuf_len(b), MONITOR_VOMP); } switch(new_state){ case VOMP_STATE_CALLPREP: // tell client our session id. monitor_tell_formatted(MONITOR_VOMP, "\nCALLTO:%06x:%s:%s:%s:%s\n", call->local.session, alloca_tohex_sid(call->local.sid), call->local.did, alloca_tohex_sid(call->remote.sid), call->remote.did); break; case VOMP_STATE_CALLENDED: monitor_tell_formatted(MONITOR_VOMP, "\nHANGUP:%06x\n", call->local.session); break; } call->local.state=new_state; return 0; } // update remote state and notify interested clients with the correct message int vomp_update_remote_state(struct vomp_call_state *call, int new_state){ if (call->remote.state>=new_state) return 0; switch(new_state){ case VOMP_STATE_RINGINGOUT: monitor_tell_formatted(MONITOR_VOMP, "\nCALLFROM:%06x:%s:%s:%s:%s\n", call->local.session, alloca_tohex_sid(call->local.sid), call->local.did, alloca_tohex_sid(call->remote.sid), call->remote.did); break; case VOMP_STATE_RINGINGIN: monitor_tell_formatted(MONITOR_VOMP, "\nRINGING:%06x\n", call->local.session); break; case VOMP_STATE_INCALL: if (call->remote.state==VOMP_STATE_RINGINGIN){ monitor_tell_formatted(MONITOR_VOMP, "\nANSWERED:%06x\n", call->local.session); } break; } call->remote.state=new_state; return 0; } // send call state updates if required. int vomp_update(struct vomp_call_state *call) { int combined_status=(call->remote.state<<4)|call->local.state; if (call->last_sent_status==combined_status) return 0; if (debug & DEBUG_VOMP) DEBUGF("Call state changed to %d %d, sending updates",call->local.state, call->remote.state); call->last_sent_status=combined_status; // tell the remote party vomp_send_status_remote(call); // tell monitor clients if (monitor_socket_count && monitor_client_interested(MONITOR_VOMP)) monitor_call_status(call); return 0; } // check a small circular buffer of recently seen audio // we're not trying to be perfect here, we still expect all clients to reorder and filter duplicates int vomp_audio_already_seen(struct vomp_call_state *call, unsigned int end_time) { int i; for(i=0;iseen_samples[i]==end_time) return 1; call->seen_samples[call->sample_pos]=end_time; call->sample_pos++; if (call->sample_pos>=VOMP_MAX_RECENT_SAMPLES *4) call->sample_pos=0; return 0; } int vomp_process_audio(struct vomp_call_state *call,unsigned int sender_duration,overlay_mdp_frame *mdp,time_ms_t now) { int ofs=14; // if (mdp->in.payload_length>14) // DEBUGF("got here (payload has %d bytes)",mdp->in.payload_length); /* Get end time marker for sample block collection */ unsigned int e=0, s=0; int sequence = call->remote.sequence; if(ofsin.payload_length) { s=mdp->in.payload[ofs++]<<24; s|=mdp->in.payload[ofs++]<<16; s|=mdp->in.payload[ofs++]<<8; s|=mdp->in.payload[ofs++]<<0; sender_duration = (s&0xFFFF0000)|sender_duration; int codec=mdp->in.payload[ofs++]; int audio_len = mdp->in.payload_length - ofs; if ((!codec)||vomp_sample_size(codec)<0) return -1; e = s + vomp_codec_timespan(codec) - 1; /* Pass audio frame to all registered listeners */ if (!vomp_audio_already_seen(call, e)){ store_jitter_sample(&call->jitter, s, now); if (monitor_socket_count) monitor_send_audio(call, codec, s, e, &mdp->in.payload[ofs], audio_len, sequence); } } return 0; } int vomp_ringing(struct vomp_call_state *call){ if (call){ if ((!call->initiated_call) && call->local.stateremote.state==VOMP_STATE_RINGINGOUT){ if (debug & DEBUG_VOMP) DEBUGF("RING RING!"); vomp_update_local_state(call, VOMP_STATE_RINGINGIN); vomp_update(call); }else return WHY("Can't ring, call is not being dialled"); } return 0; } int vomp_call_destroy(struct vomp_call_state *call) { if (debug & DEBUG_VOMP) DEBUGF("Destroying call %06x:%06x [%s,%s]", call->local.session, call->remote.session, call->local.did,call->remote.did); /* now release the call structure */ int i = (call - vomp_call_states); unschedule(&call->alarm); call->local.session=0; call->remote.session=0; vomp_call_count--; if (i!=vomp_call_count){ unschedule(&vomp_call_states[vomp_call_count].alarm); bcopy(&vomp_call_states[vomp_call_count], call, sizeof(struct vomp_call_state)); schedule(&call->alarm); } return 0; } int vomp_dial(unsigned char *local_sid, unsigned char *remote_sid, const char *local_did, const char *remote_did) { /* TODO use local_did and remote_did start putting the call together. These need to be passed to the node being called to provide caller id, and potentially handle call-routing, e.g., if it is a gateway. */ if (debug & DEBUG_VOMP) DEBUG("Dialing"); if (vomp_call_count>=VOMP_MAX_CALLS) return WHY("All call slots in use"); /* allocate unique call session token, which is how the client will refer to this call during its life */ struct vomp_call_state *call=vomp_create_call( remote_sid, local_sid, 0, 0); /* Copy local / remote phone numbers */ strlcpy(call->local.did, local_did, sizeof(call->local.did)); strlcpy(call->remote.did, remote_did, sizeof(call->remote.did)); vomp_update_local_state(call, VOMP_STATE_CALLPREP); // remember that we initiated this call, not the other party call->initiated_call = 1; /* send status update to remote, thus causing call to be created (hopefully) at far end. */ vomp_update(call); return 0; } int vomp_pickup(struct vomp_call_state *call) { if (call){ if (debug & DEBUG_VOMP) DEBUG("Picking up"); if (call->local.state<=VOMP_STATE_RINGINGIN && call->remote.state==VOMP_STATE_RINGINGOUT){ vomp_update_local_state(call, VOMP_STATE_INCALL); call->create_time=gettime_ms(); /* state machine does job of starting audio stream, just tell everyone about the changed state. */ vomp_update(call); }else return WHY("Can't pickup, call is not ringing"); } return 0; } int vomp_hangup(struct vomp_call_state *call) { if (call){ if (debug & DEBUG_VOMP) DEBUG("Hanging up"); vomp_update_local_state(call, VOMP_STATE_CALLENDED); vomp_update(call); } return 0; } int vomp_extract_remote_codec_list(struct vomp_call_state *call,overlay_mdp_frame *mdp) { int ofs=14; if (debug & DEBUG_VOMP) dump("codec list mdp frame", (unsigned char *)&mdp->in.payload[0],mdp->in.payload_length); for (;ofsin.payload_length && mdp->in.payload[ofs];ofs++){ int codec = mdp->in.payload[ofs]; set_codec_flag(codec, call->remote_codec_flags); } if (!call->initiated_call){ ofs++; if (ofsin.payload_length) ofs+=strlcpy(call->remote.did, (char *)(mdp->in.payload+ofs), sizeof(call->remote.did))+1; if (ofsin.payload_length) ofs+=strlcpy(call->local.did, (char *)(mdp->in.payload+ofs), sizeof(call->local.did)); } return 0; } /* At this point we know the MDP frame is addressed to the VoMP port, but we have not inspected the contents. As these frames are wire-format, we must pay attention to endianness. */ int vomp_mdp_received(overlay_mdp_frame *mdp) { time_ms_t now = gettime_ms(); if (mdp->packetTypeAndFlags&(MDP_NOCRYPT|MDP_NOSIGN)) { /* stream-crypted audio frame */ return WHY("not implemented"); } /* only auth-crypted frames make it this far */ struct vomp_call_state *call=NULL; switch(mdp->in.payload[0]) { case 0x01: /* Ordinary VoMP state+optional audio frame */ { int recvr_state=mdp->in.payload[1]>>4; int sender_state=mdp->in.payload[1]&0xf; unsigned int recvr_session= (mdp->in.payload[8]<<16)|(mdp->in.payload[9]<<8)|mdp->in.payload[10]; unsigned int sender_session= (mdp->in.payload[11]<<16)|(mdp->in.payload[12]<<8)|mdp->in.payload[13]; int sender_seq=(mdp->in.payload[4]<<8)+mdp->in.payload[5]; // cyclic ~1 minute timer... unsigned int sender_duration = (mdp->in.payload[6]<<8) | mdp->in.payload[7]; /* wants to create a call session. Main aim here: replay protection. An adversary should not be able to replay previous VoMP packets to cause any action. We do this by allocating a new session number for each call. As an adversary may be trying to use such replays to cause a denial of service attack we need to be able to track multiple potential session numbers even from the same SID. */ call=vomp_find_or_create_call(mdp->in.src.sid,mdp->in.dst.sid, sender_session,recvr_session, sender_state,recvr_state); if (!call) return WHY("Unable to find or create call"); if (!recvr_session && (debug & DEBUG_VOMP)) DEBUG("recvr_session==0, created call"); recvr_state = call->local.state; call->remote.sequence=sender_seq; // TODO ignore state changes if sequence is stale? // TODO ignore state changes that seem to go backwards? if ((!monitor_socket_count) &&(!monitor_client_interested(MONITOR_VOMP))) { /* No registered listener, so we cannot answer the call, so just reject it. */ WHY("Rejecting call, no listening clients"); recvr_state=VOMP_STATE_CALLENDED; /* now let the state machine progress to destroy the call */ } if (recvr_state < VOMP_STATE_RINGINGOUT && sender_state < VOMP_STATE_RINGINGOUT){ unsigned char supported_codecs[CODEC_FLAGS_LENGTH]; int i, found=0; // the other party should have given us their list of supported codecs vomp_extract_remote_codec_list(call,mdp); // make sure we have at least one codec in common monitor_get_all_supported_codecs(supported_codecs); // look for a matching bit for (i=0;iremote_codec_flags[i]){ found=1; break; } } // nope, we can't speak the same language. if (!found){ WHY("Rejecting call, no matching codecs found"); recvr_state=VOMP_STATE_CALLENDED; } } if (sender_state==VOMP_STATE_CALLENDED){ /* For whatever reason, the far end has given up on the call, so we must also move to CALLENDED no matter what state we were in */ recvr_state=VOMP_STATE_CALLENDED; } /* Consider states: our actual state, sender state, what the sender thinks our state is, and what we think the sender's state is. But largely it breaks down to what we think our state is, and what they think their state is. That leaves us with just 6X6=36 cases. */ int combined_state=recvr_state<<3 | sender_state; switch(combined_state) { case (VOMP_STATE_NOCALL<<3)|VOMP_STATE_CALLPREP: /* The remote party is in the call-prep state tryng to dial us. We'll send them our codec list, then they can tell us to ring. */ break; case (VOMP_STATE_RINGINGIN<<3)|VOMP_STATE_RINGINGOUT: /* they are ringing us and we are ringing. Lets keep doing that. */ case (VOMP_STATE_NOCALL<<3)|VOMP_STATE_RINGINGOUT: /* We have have issued a session, the remote party is now indicating that they would like us to start ringing. So change our state to RINGINGIN. */ if (call->initiated_call) // hey, quit it, we were trying to call you. recvr_state=VOMP_STATE_CALLENDED; else{ // Don't automatically transition to RINGIN, wait for a client to tell us when. } break; case (VOMP_STATE_CALLPREP<<3)|VOMP_STATE_NOCALL: case (VOMP_STATE_CALLPREP<<3)|VOMP_STATE_CALLPREP: /* We are getting ready to ring, and the other end has issued a session number, (and may be calling us at the same time). Now is the time to ring out. However, until the remote party has acknowledged with RINGIN, don't indicate their ringing state to the user. */ if (call->initiated_call){ // TODO fail the call if we can't agree on codec's recvr_state=VOMP_STATE_RINGINGOUT; }else{ recvr_state=VOMP_STATE_CALLENDED; } break; case (VOMP_STATE_RINGINGOUT<<3)|VOMP_STATE_NOCALL: case (VOMP_STATE_RINGINGOUT<<3)|VOMP_STATE_CALLPREP: /* We are calling them, and they have not yet answered, just wait */ break; case (VOMP_STATE_RINGINGOUT<<3)|VOMP_STATE_RINGINGIN: /* we are calling them and they have acknowledged it. Now we can play a tone to indicate they are ringing */ break; case (VOMP_STATE_RINGINGOUT<<3)|VOMP_STATE_RINGINGOUT: /* Woah, we're trying to dial each other?? That must have been well timed. Jump to INCALL and start audio */ recvr_state=VOMP_STATE_INCALL; // reset create time when call is established call->create_time=gettime_ms(); break; case (VOMP_STATE_INCALL<<3)|VOMP_STATE_RINGINGOUT: /* we think the call is in progress, but the far end hasn't replied yet Just wait. */ break; case (VOMP_STATE_RINGINGOUT<<3)|VOMP_STATE_INCALL: /* They have answered, we can jump to incall as well */ recvr_state=VOMP_STATE_INCALL; // reset create time when call is established call->create_time=gettime_ms(); // Fall through case (VOMP_STATE_INCALL<<3)|VOMP_STATE_INCALL: /* play any audio that they have sent us. */ vomp_process_audio(call,sender_duration,mdp,now); break; case (VOMP_STATE_CALLENDED<<3)|VOMP_STATE_NOCALL: case (VOMP_STATE_CALLENDED<<3)|VOMP_STATE_CALLPREP: case (VOMP_STATE_CALLENDED<<3)|VOMP_STATE_RINGINGOUT: case (VOMP_STATE_CALLENDED<<3)|VOMP_STATE_RINGINGIN: case (VOMP_STATE_CALLENDED<<3)|VOMP_STATE_INCALL: case (VOMP_STATE_CALLENDED<<3)|VOMP_STATE_CALLENDED: /* If we ended the call, we'll wait for the far end to reply before destroying it */ break; default: /* Any state not explicitly listed above is considered invalid and possibly stale, the packet will be completely ignored. */ WHYF("Ignoring invalid call state %d.%d",sender_state,recvr_state); return 0; } vomp_update_remote_state(call, sender_state); vomp_update_local_state(call, recvr_state); call->last_activity=gettime_ms(); // TODO if we hear a stale echo of our state should we force another outgoing packet now? // will that always cause 2 outgoing packets? /* send an update to the call status if required */ vomp_update(call); } return 0; break; default: /* unsupported VoMP frame */ WHYF("Unsupported VoMP frame type = 0x%02x",mdp->in.payload[0]); break; } return WHY("Malformed VoMP MDP packet?"); } static const char *vomp_describe_codec(int c) { switch(c) { case VOMP_CODEC_NONE: return "none"; case VOMP_CODEC_CODEC2_2400: return "CODEC2@1400"; case VOMP_CODEC_CODEC2_1400: return "CODEC2@2400"; case VOMP_CODEC_GSMHALF: return "GSM-half-rate"; case VOMP_CODEC_GSMFULL: return "GSM-full-rate"; case VOMP_CODEC_16SIGNED: return "16bit-raw"; case VOMP_CODEC_8ULAW: return "8bit-uLaw"; case VOMP_CODEC_8ALAW: return "8bit-aLaw"; case VOMP_CODEC_PCM: return "PCM@8KHz"; case VOMP_CODEC_DTMF: return "DTMF"; case VOMP_CODEC_ENGAGED: return "Engaged-tone"; case VOMP_CODEC_ONHOLD: return "On-Hold"; } return "unknown"; } int vomp_sample_size(int c) { switch(c) { case VOMP_CODEC_NONE: return 0; case VOMP_CODEC_CODEC2_2400: return 7; /* actually 2550bps, 51 bits per 20ms, but using whole byte here, so 2800bps */ case VOMP_CODEC_CODEC2_1400: return 7; /* per 40ms */ case VOMP_CODEC_GSMHALF: return 14; /* check. 5.6kbits */ case VOMP_CODEC_GSMFULL: return 33; /* padded to 13.2kbit/sec */ case VOMP_CODEC_16SIGNED: return 320; /* 8000x2bytes*0.02sec */ case VOMP_CODEC_8ULAW: return 160; case VOMP_CODEC_8ALAW: return 160; case VOMP_CODEC_PCM: return 320; case VOMP_CODEC_DTMF: return 1; case VOMP_CODEC_ENGAGED: return 0; case VOMP_CODEC_ONHOLD: return 0; } return -1; } int vomp_codec_timespan(int c) { switch(c) { case VOMP_CODEC_NONE: return 1; case VOMP_CODEC_CODEC2_2400: return 20; case VOMP_CODEC_CODEC2_1400: return 40; case VOMP_CODEC_GSMHALF: return 20; case VOMP_CODEC_GSMFULL: return 20; case VOMP_CODEC_16SIGNED: return 20; case VOMP_CODEC_8ULAW: return 20; case VOMP_CODEC_8ALAW: return 20; case VOMP_CODEC_PCM: return 20; case VOMP_CODEC_DTMF: return 80; case VOMP_CODEC_ENGAGED: return 20; case VOMP_CODEC_ONHOLD: return 20; } return -1; } int vomp_parse_dtmf_digit(char c) { if (c>='0'&&c<='9') return c-0x30; switch (c) { case 'a': case 'A': return 0xa; case 'b': case 'B': return 0xb; case 'c': case 'C': return 0xc; case 'd': case 'D': return 0xd; case '*': return 0xe; case '#': return 0xf; } return -1; } char vomp_dtmf_digit_to_char(int digit) { if (digit<0) return '?'; if (digit<10) return '0'+digit; if (digit<0xe) return 'A'+digit-0xa; if (digit==0xe) return '*'; if (digit==0xf) return '#'; return '?'; } static void vomp_process_tick(struct sched_ent *alarm) { char msg[32]; int len; time_ms_t now = gettime_ms(); struct vomp_call_state *call = (struct vomp_call_state *)alarm; /* See if any calls need to be expired. Allow VOMP_CALL_DIAL_TIMEOUT ms for the other party to ring / request ringing Allow VOMP_CALL_RING_TIMEOUT ms for the ringing party to answer Allow VOMP_CALL_NETWORK_TIMEOUT ms between received packets */ if ((call->remote.state < VOMP_STATE_RINGINGOUT && call->create_time + VOMP_CALL_DIAL_TIMEOUT < now) || (call->local.state < VOMP_STATE_INCALL && call->create_time + VOMP_CALL_RING_TIMEOUT < now) || (call->last_activity+VOMP_CALL_NETWORK_TIMEOUTlocal.state==VOMP_STATE_CALLENDED &&call->remote.state==VOMP_STATE_CALLENDED){ vomp_call_destroy(call); return; } /* update everyone if the state has changed */ vomp_update(call); /* force a packet to the other party. We are still here */ vomp_send_status_remote(call); /* tell local monitor clients the call is still alive */ len = snprintf(msg,sizeof(msg) -1,"\nKEEPALIVE:%06x\n", call->local.session); monitor_tell_clients(msg, len, MONITOR_VOMP); alarm->alarm = gettime_ms() + VOMP_CALL_STATUS_INTERVAL; alarm->deadline = alarm->alarm + VOMP_CALL_STATUS_INTERVAL/2; schedule(alarm); }