From 4a04e7ed6f313ca6d648098dc06a60d94ac10e9f Mon Sep 17 00:00:00 2001
From: Jan Kiene <jan.kiene@iis.fraunhofer.de>
Date: Wed, 15 Oct 2025 16:40:17 +0200
Subject: [PATCH 01/12] port MR 2173 from float repo

Resolve "Delay alignment in external renderer" and "External renderer crashes when rendering OMASA"
---
 Workspace_msvc/lib_rend.vcxproj |   1 +
 apps/renderer.c                 | 109 +++--
 lib_isar/lib_isar_pre_rend.c    |   4 +-
 lib_rend/ivas_prot_rend.h       |  34 ++
 lib_rend/ivas_stat_rend.h       |  16 +
 lib_rend/lib_rend.c             | 810 ++++++++++++++++++++++----------
 lib_rend/lib_rend.h             |  29 +-
 7 files changed, 689 insertions(+), 314 deletions(-)
diff --git a/Workspace_msvc/lib_rend.vcxproj b/Workspace_msvc/lib_rend.vcxproj
index 27d4a19a6..854c99a97 100644
--- a/Workspace_msvc/lib_rend.vcxproj
+++ b/Workspace_msvc/lib_rend.vcxproj
@@ -175,6 +175,7 @@
     <ClCompile Include="..\lib_rend\ivas_rom_rend.c" />
     <ClCompile Include="..\lib_rend\ivas_shoebox.c" />
     <ClCompile Include="..\lib_rend\ivas_td_decorr.c" />
+    <ClCompile Include="..\lib_rend\ivas_td_ring_buffer.c" />
     <ClCompile Include="..\lib_rend\ivas_vbap.c" />
     <ClCompile Include="..\lib_rend\lib_rend.c" />
   </ItemGroup>
diff --git a/apps/renderer.c b/apps/renderer.c
index 72a294807..2f18e1ab5 100644
--- a/apps/renderer.c
+++ b/apps/renderer.c
@@ -724,6 +724,7 @@ int main(
     SplitFileReadWrite *hSplitRendFileReadWrite;
     int16_t delayNumSamples_temp;
     int32_t delayTimeScale_temp;
+    bool flushRendererLastFrame = false;
     int16_t numSamplesRead;
     int16_t delayNumSamples = -1;
     int16_t delayNumSamples_orig = 0;
@@ -770,8 +771,11 @@ int main(
 
     CmdlnArgs args = parseCmdlnArgs( argc, argv );
 
-    if ( args.nonDiegeticPan && !( ( args.inConfig.numAudioObjects == 0 && args.inConfig.multiChannelBuses[0].audioConfig == IVAS_AUDIO_CONFIG_MONO ) ||
-                                   ( args.inConfig.numAudioObjects > 0 && args.inConfig.audioObjects[0].audioConfig == IVAS_AUDIO_CONFIG_OBA && args.inConfig.numAudioObjects == 1 ) ) )
+    if ( args.nonDiegeticPan &&
+         !( ( args.inConfig.numAudioObjects == 0 &&
+              args.inConfig.multiChannelBuses[0].audioConfig == IVAS_AUDIO_CONFIG_MONO ) ||
+            ( args.inConfig.numAudioObjects > 0 &&
+              args.inConfig.audioObjects[0].audioConfig == IVAS_AUDIO_CONFIG_OBA && args.inConfig.numAudioObjects == 1 ) ) )
     {
         fprintf( stderr, "\ninvalid configuration - non-diegetic panning requires mono or ISM1 input\n" );
         goto cleanup;
@@ -1114,7 +1118,10 @@ int main(
         IVAS_RENDER_CONFIG_DATA renderConfig;
 #endif
         /* sanity check */
-        if ( ( args.outConfig.audioConfig != IVAS_AUDIO_CONFIG_BINAURAL ) && ( args.outConfig.audioConfig != IVAS_AUDIO_CONFIG_BINAURAL_ROOM_IR ) && ( args.outConfig.audioConfig != IVAS_AUDIO_CONFIG_BINAURAL_ROOM_REVERB ) && !is_split_pre_rend_mode( &args ) )
+        if ( ( args.outConfig.audioConfig != IVAS_AUDIO_CONFIG_BINAURAL ) &&
+             ( args.outConfig.audioConfig != IVAS_AUDIO_CONFIG_BINAURAL_ROOM_IR ) &&
+             ( args.outConfig.audioConfig != IVAS_AUDIO_CONFIG_BINAURAL_ROOM_REVERB ) &&
+             !is_split_pre_rend_mode( &args ) )
         {
             fprintf( stderr, "\nExternal Renderer Config is supported only when binaural output configurations is used as output OR when Split pre-rendering mode is enabled. Exiting. \n" );
             goto cleanup;
@@ -1409,7 +1416,7 @@ int main(
     }
 
     int16_t numOutChannels;
-    if ( ( error = IVAS_REND_NumOutChannels( hIvasRend, &numOutChannels ) ) != IVAS_ERR_OK )
+    if ( ( error = IVAS_REND_GetNumOutChannels( hIvasRend, &numOutChannels ) ) != IVAS_ERR_OK )
     {
         fprintf( stderr, "\nError in IVAS_REND_NumOutChannels(): %s\n", ivas_error_to_string( error ) );
         goto cleanup;
@@ -1424,8 +1431,16 @@ int main(
         }
     }
 
-    if ( args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_CODED )
+    if ( args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_CODED || args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM )
     {
+        char *outFile = args.outMetadataFilePath;
+
+        if ( args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_CODED )
+        {
+            outFile = args.outputFilePath;
+            audioWriter = NULL;
+        }
+
         if ( ( error = IVAS_REND_GetSplitRendBitstreamHeader( hIvasRend, &bitsBuffer.config.codec, &bitsBuffer.config.poseCorrection, &bitsBuffer.config.codec_frame_size_ms, &bitsBuffer.config.isar_frame_size_ms ) ) != IVAS_ERR_OK )
         {
             fprintf( stderr, "\nError in IVAS_REND_GetSplitRendBitstreamHeader()!\n" );
@@ -1438,36 +1453,15 @@ int main(
             goto cleanup;
         }
 
-        if ( ( error = split_rend_writer_open( &hSplitRendFileReadWrite, args.outputFilePath, delayNumSamples_temp, delayTimeScale_temp, bitsBuffer.config.codec, bitsBuffer.config.poseCorrection, bitsBuffer.config.codec_frame_size_ms, bitsBuffer.config.isar_frame_size_ms, args.sampleRate, bitsBuffer.config.lc3plus_highres ) ) != IVAS_ERR_OK )
+        if ( ( error = split_rend_writer_open( &hSplitRendFileReadWrite, outFile, delayNumSamples_temp, delayTimeScale_temp, bitsBuffer.config.codec, bitsBuffer.config.poseCorrection, bitsBuffer.config.codec_frame_size_ms, bitsBuffer.config.isar_frame_size_ms, args.sampleRate, bitsBuffer.config.lc3plus_highres ) ) != IVAS_ERR_OK )
         {
-            fprintf( stderr, "\nCould not open split rend metadata file %s\n", args.outputFilePath );
+            fprintf( stderr, "\nCould not open split rend metadata file %s\n", outFile );
             goto cleanup;
         }
-        audioWriter = NULL;
     }
-    else
-    {
-        if ( args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM )
-        {
-            if ( ( error = IVAS_REND_GetSplitRendBitstreamHeader( hIvasRend, &bitsBuffer.config.codec, &bitsBuffer.config.poseCorrection, &bitsBuffer.config.codec_frame_size_ms, &bitsBuffer.config.isar_frame_size_ms ) ) != IVAS_ERR_OK )
-            {
-                fprintf( stderr, "\nError in IVAS_REND_GetSplitRendBitstreamHeader()!\n" );
-                goto cleanup;
-            }
-
-            if ( IVAS_REND_GetDelay( hIvasRend, &delayNumSamples_temp, &delayTimeScale_temp ) != IVAS_ERR_OK )
-            {
-                fprintf( stderr, "\nUnable to get delay of renderer!\n" );
-                goto cleanup;
-            }
-
-            if ( ( error = split_rend_writer_open( &hSplitRendFileReadWrite, args.outMetadataFilePath, delayNumSamples_temp, delayTimeScale_temp, bitsBuffer.config.codec, bitsBuffer.config.poseCorrection, bitsBuffer.config.codec_frame_size_ms, bitsBuffer.config.isar_frame_size_ms, args.sampleRate, bitsBuffer.config.lc3plus_highres ) ) != IVAS_ERR_OK )
-            {
-                fprintf( stderr, "\nCould not open split rend metadata file %s\n", args.outMetadataFilePath );
-                goto cleanup;
-            }
-        }
 
+    if ( args.outConfig.audioConfig != IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_CODED )
+    {
         if ( AudioFileWriter_open( &audioWriter, args.outputFilePath, args.sampleRate, numOutChannels ) != IVAS_ERR_OK )
         {
             fprintf( stderr, "\nFailed to open file: %s\n", args.outputFilePath );
@@ -1597,16 +1591,23 @@ int main(
         if ( numSamplesRead == 0 )
         {
             /* end of input data */
-            break;
+            flushRendererLastFrame = true;
         }
 
         /* Convert from int to float and from interleaved to packed */
-        convertInputBuffer( inpInt16Buffer, numSamplesRead, inBuffer.config.numSamplesPerChannel, num_in_channels, inFloatBuffer, inBuffer.config.is_cldfb, cldfbAna );
+        if ( !flushRendererLastFrame )
+        {
+            convertInputBuffer( inpInt16Buffer, numSamplesRead, inBuffer.config.numSamplesPerChannel, num_in_channels, inFloatBuffer, inBuffer.config.is_cldfb, cldfbAna );
+        }
+        else
+        {
+            memset( inBuffer.data, 0, inBuffer.config.numChannels * inBuffer.config.numSamplesPerChannel * sizeof( float ) );
+        }
 
         int16_t num_subframes, sf_idx;
         num_subframes = (int16_t) args.render_framesize;
 
-        if ( isCurrentFrameMultipleOf20ms )
+        if ( isCurrentFrameMultipleOf20ms && !flushRendererLastFrame )
         {
             IsmPositionProvider_getNextFrame( positionProvider, &mtdBuffer );
 
@@ -1718,7 +1719,7 @@ int main(
             }
             IVAS_REND_ReadOnlyAudioBuffer tmpBuffer = getReadOnlySubBuffer( inBuffer, (int16_t) args.inConfig.multiChannelBuses[i].inputChannelIndex, numChannels );
 
-            if ( ( error = IVAS_REND_FeedInputAudio( hIvasRend, mcIds[i], tmpBuffer ) ) != IVAS_ERR_OK )
+            if ( ( error = IVAS_REND_FeedInputAudio( hIvasRend, mcIds[i], tmpBuffer, flushRendererLastFrame ) ) != IVAS_ERR_OK )
             {
                 fprintf( stderr, "\nIVAS_REND_FeedInputAudio failed: %s\n", ivas_error_to_string( error ) );
                 goto cleanup;
@@ -1733,7 +1734,7 @@ int main(
                 {
                     IVAS_REND_ReadOnlyAudioBuffer tmpBuffer = getReadOnlySubBuffer( inBuffer, (int16_t) args.inConfig.audioObjects[i].inputChannelIndex, args.inConfig.numAudioObjects );
 
-                    if ( ( error = IVAS_REND_FeedInputAudio( hIvasRend, ismIds[i], tmpBuffer ) ) != IVAS_ERR_OK )
+                    if ( ( error = IVAS_REND_FeedInputAudio( hIvasRend, ismIds[i], tmpBuffer, flushRendererLastFrame ) ) != IVAS_ERR_OK )
                     {
                         fprintf( stderr, "\nIVAS_REND_FeedInputAudio failed: %s\n", ivas_error_to_string( error ) );
                         goto cleanup;
@@ -1750,7 +1751,7 @@ int main(
             {
                 IVAS_REND_ReadOnlyAudioBuffer tmpBuffer = getReadOnlySubBuffer( inBuffer, (int16_t) args.inConfig.audioObjects[i].inputChannelIndex, 1 );
 
-                if ( ( error = IVAS_REND_FeedInputAudio( hIvasRend, ismIds[i], tmpBuffer ) ) != IVAS_ERR_OK )
+                if ( ( error = IVAS_REND_FeedInputAudio( hIvasRend, ismIds[i], tmpBuffer, flushRendererLastFrame ) ) != IVAS_ERR_OK )
                 {
                     fprintf( stderr, "\nIVAS_REND_FeedInputAudio failed: %s\n", ivas_error_to_string( error ) );
                     goto cleanup;
@@ -1773,7 +1774,7 @@ int main(
             }
             IVAS_REND_ReadOnlyAudioBuffer tmpBuffer = getReadOnlySubBuffer( inBuffer, (int16_t) args.inConfig.ambisonicsBuses[i].inputChannelIndex, numChannels );
 
-            if ( ( error = IVAS_REND_FeedInputAudio( hIvasRend, sbaIds[i], tmpBuffer ) ) != IVAS_ERR_OK )
+            if ( ( error = IVAS_REND_FeedInputAudio( hIvasRend, sbaIds[i], tmpBuffer, flushRendererLastFrame ) ) != IVAS_ERR_OK )
             {
                 fprintf( stderr, "\nIVAS_REND_FeedInputAudio failed: %s\n", ivas_error_to_string( error ) );
                 goto cleanup;
@@ -1789,13 +1790,13 @@ int main(
             }
             IVAS_REND_ReadOnlyAudioBuffer tmpBuffer = getReadOnlySubBuffer( inBuffer, (int16_t) args.inConfig.masaBuses[i].inputChannelIndex, numChannels );
 
-            if ( ( error = IVAS_REND_FeedInputAudio( hIvasRend, masaIds[i], tmpBuffer ) ) != IVAS_ERR_OK )
+            if ( ( error = IVAS_REND_FeedInputAudio( hIvasRend, masaIds[i], tmpBuffer, flushRendererLastFrame ) ) != IVAS_ERR_OK )
             {
                 fprintf( stderr, "IVAS_REND_FeedInputAudio failed: %s\n", ivas_error_to_string( error ) );
                 goto cleanup;
             }
 
-            if ( isCurrentFrameMultipleOf20ms )
+            if ( isCurrentFrameMultipleOf20ms && !flushRendererLastFrame )
             {
                 if ( masaReaders[i] != NULL )
                 {
@@ -1858,7 +1859,7 @@ int main(
             zeroPad = delayNumSamples;
         }
 
-        if ( is_split_pre_rend_mode( &args ) )
+        if ( is_split_pre_rend_mode( &args ) && !flushRendererLastFrame )
         {
             if ( split_rend_write_bitstream_to_file( hSplitRendFileReadWrite, bitsBuffer.bits, &bitsBuffer.config.bitsRead,
                                                      &bitsBuffer.config.bitsWritten ) != IVAS_ERR_OK )
@@ -1868,7 +1869,7 @@ int main(
             }
         }
 
-        if ( audioWriter != NULL )
+        if ( audioWriter != NULL && !flushRendererLastFrame )
         {
             if ( delayNumSamples * num_out_channels < outBufferSize )
             {
@@ -1889,7 +1890,7 @@ int main(
         bitsBuffer.config.bitsWritten = 0;
 
         /* Write MASA metadata for MASA outputs */
-        if ( args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_MASA1 || args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_MASA2 )
+        if ( !flushRendererLastFrame && ( args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_MASA1 || args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_MASA2 ) )
         {
             IVAS_REND_AudioConfigType inputType1;
             IVAS_REND_AudioConfigType inputType2;
@@ -1961,7 +1962,8 @@ int main(
                     }
                 }
 
-                if ( ( args.inConfig.numAmbisonicsBuses > 0 || args.inConfig.numMultiChannelBuses > 0 || args.inConfig.numMasaBuses > 0 ) && args.inConfig.numAudioObjects > 0 )
+                if ( ( args.inConfig.numAmbisonicsBuses > 0 || args.inConfig.numMultiChannelBuses > 0 || args.inConfig.numMasaBuses > 0 ) &&
+                     args.inConfig.numAudioObjects > 0 )
                 {
                     inputType2 = IVAS_REND_AUDIO_CONFIG_TYPE_OBJECT_BASED;
                     if ( ( error = IVAS_REND_MergeMasaMetadata( hIvasRend, &hMetaOutput, inputType1, inputType2 ) ) != IVAS_ERR_OK )
@@ -1977,6 +1979,13 @@ int main(
             }
         }
 
+        /* no new input was actually read, only delay buffers were flushed
+         * therefore this is not a real frame */
+        if ( flushRendererLastFrame )
+        {
+            break;
+        }
+
         frame++;
         if ( !args.quietModeEnabled )
         {
@@ -1989,12 +1998,13 @@ int main(
 #endif
     }
 
-    /* add zeros at the end to have equal length of synthesized signals */
+    /* add zeros at the end to have equal length of synthesized signals
+     * the output buffer will contain either leftover input samples from delay aligned inputs
+     * or zeros for padding */
     if ( audioWriter != NULL )
     {
         for ( zeroPadToWrite = zeroPad; zeroPadToWrite > frameSize_smpls; zeroPadToWrite -= frameSize_smpls )
         {
-            memset( outInt16Buffer, 0, outBufferSize * sizeof( int16_t ) );
             if ( ( error = AudioFileWriter_write( audioWriter, outInt16Buffer, outBufferSize ) ) != IVAS_ERR_OK )
             {
                 fprintf( stderr, "\nOutput audio file writer error\n" );
@@ -2002,7 +2012,6 @@ int main(
             }
         }
 
-        memset( outInt16Buffer, 0, zeroPadToWrite * outBuffer.config.numChannels * sizeof( int16_t ) );
         if ( ( error = AudioFileWriter_write( audioWriter, outInt16Buffer, zeroPadToWrite * outBuffer.config.numChannels ) ) != IVAS_ERR_OK )
         {
             fprintf( stderr, "\nOutput audio file writer error\n" );
@@ -2011,9 +2020,10 @@ int main(
         zeroPadToWrite = 0;
     }
 
-    if ( args.inConfig.numAudioObjects != 0 && ( args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_BINAURAL || args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_BINAURAL_ROOM_REVERB ) )
+    if ( args.inConfig.numAudioObjects != 0 &&
+         ( args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_BINAURAL || args.outConfig.audioConfig == IVAS_AUDIO_CONFIG_BINAURAL_ROOM_REVERB ) )
     {
-        fprintf( stdout, "\n\nMetadata delayed %d subframes\n\n", (int16_t) round( args.syncMdDelay / ( 1000 / IVAS_NUM_FRAMES_PER_SEC / IVAS_MAX_PARAM_SPATIAL_SUBFRAMES ) ) );
+        fprintf( stdout, "\n\nMetadata delayed %d subframes\n\n", (int16_t) round( args.syncMdDelay / ( 1000.f / IVAS_NUM_FRAMES_PER_SEC / IVAS_MAX_PARAM_SPATIAL_SUBFRAMES ) ) );
     }
 
     if ( !args.quietModeEnabled && args.delayCompensationEnabled )
@@ -3433,7 +3443,8 @@ static void parseObjectPosition(
     *positionDuration = (uint16_t) strtol( line, &endptr, 10 );
     readNextMetadataChunk( line, "\n" );
 
-    read_values = (int16_t) sscanf( line, "%f,%f,%f,%f,%f,%f,%f,%f", &meta_prm[0], &meta_prm[1], &meta_prm[2], &meta_prm[3], &meta_prm[4], &meta_prm[5], &meta_prm[6], &meta_prm[7] );
+    read_values = (int16_t) sscanf( line, "%f,%f,%f,%f,%f,%f,%f,%f",
+                                    &meta_prm[0], &meta_prm[1], &meta_prm[2], &meta_prm[3], &meta_prm[4], &meta_prm[5], &meta_prm[6], &meta_prm[7] );
 
     if ( read_values < 2 )
     {
diff --git a/lib_isar/lib_isar_pre_rend.c b/lib_isar/lib_isar_pre_rend.c
index 2e6c70b47..bcd6560dc 100644
--- a/lib_isar/lib_isar_pre_rend.c
+++ b/lib_isar/lib_isar_pre_rend.c
@@ -115,9 +115,7 @@ ivas_error ISAR_PRE_REND_open(
         isCldfbNeeded = 1;
     }
 
-    hSplitBinRend->hCldfbHandles = NULL;
-
-    if ( isCldfbNeeded )
+    if ( isCldfbNeeded && hSplitBinRend->hCldfbHandles == NULL )
     {
         if ( ( hSplitBinRend->hCldfbHandles = (CLDFB_HANDLES_WRAPPER_HANDLE) malloc( sizeof( CLDFB_HANDLES_WRAPPER ) ) ) == NULL )
         {
diff --git a/lib_rend/ivas_prot_rend.h b/lib_rend/ivas_prot_rend.h
index 1a86ba3bb..7895a6134 100644
--- a/lib_rend/ivas_prot_rend.h
+++ b/lib_rend/ivas_prot_rend.h
@@ -1622,6 +1622,40 @@ void ivas_rend_closeCldfbRend(
     CLDFB_REND_WRAPPER *pCldfbRend 
 );
 
+/*----------------------------------------------------------------------------------*
+ * Time domain ring buffer prototypes
+ *----------------------------------------------------------------------------------*/
+
+ivas_error ivas_TD_RINGBUF_Open(
+    TD_RINGBUF_HANDLE *ph,                                      /* i/o: Ring buffer handle                     */
+    const uint32_t capacity_per_channel,                        /* i  : Number of samples stored per channel   */
+    const uint16_t num_channels                                 /* i  : Number of channels                     */
+);
+
+void ivas_TD_RINGBUF_Close( 
+    TD_RINGBUF_HANDLE *ph                                       /* i/o: Ring buffer handle                      */
+);
+
+void ivas_TD_RINGBUF_Push( 
+    TD_RINGBUF_HANDLE h,                                        /* i/o: Ring buffer handle                       */
+    const float *data,                                          /* i  : Input data                               */
+    const uint32_t num_samples_per_channel                      /* i  : Number of samples per channel to store   */
+);
+
+void ivas_TD_RINGBUF_PushZeros( 
+    TD_RINGBUF_HANDLE h,                                        /* i/o: Ring buffer handle                      */
+    const uint32_t num_samples_per_channel                      /* i  : Number of zeros per channel to store    */
+);
+
+void ivas_TD_RINGBUF_Pop( 
+    TD_RINGBUF_HANDLE h,                                        /* i/o: Ring buffer handle                      */
+    float *data,                                                /* o  : Output data                             */
+    const uint32_t num_samples_per_channel                      /* i  : Number of samples per channel to retrieve */
+);
+
+uint32_t ivas_TD_RINGBUF_Size(
+    const TD_RINGBUF_HANDLE h                                   /* i  : Ring buffer handle                      */
+);
 
 /* clang-format on */
 
diff --git a/lib_rend/ivas_stat_rend.h b/lib_rend/ivas_stat_rend.h
index 67c7fbbcb..ce407e261 100644
--- a/lib_rend/ivas_stat_rend.h
+++ b/lib_rend/ivas_stat_rend.h
@@ -1498,6 +1498,22 @@ typedef struct
 } CLDFB_REND_WRAPPER;
 
 
+/*----------------------------------------------------------------------------------*
+ * Time domain ring buffer structure
+ *----------------------------------------------------------------------------------*/
+
+typedef struct
+{
+    float *data; /* samples in interleaved layout */
+    uint32_t capacity; /* NOTE(review): unit (total samples vs. samples per channel) is not visible here - confirm against ivas_td_ring_buffer.c */
+    uint16_t num_channels; /* number of channels held in data */
+    uint32_t write_pos; /* write position; NOTE(review): indexing unit not visible here - confirm */
+    uint32_t read_pos; /* read position; NOTE(review): indexing unit not visible here - confirm */
+    int16_t is_full; /* presumably tells a full buffer from an empty one when write_pos == read_pos - TODO confirm */
+
+} TD_RINGBUF_DATA, *TD_RINGBUF_HANDLE;
+
+
 /*----------------------------------------------------------------------------------*
  * MASA external renderer structure
  *----------------------------------------------------------------------------------*/
diff --git a/lib_rend/lib_rend.c b/lib_rend/lib_rend.c
index 07c3d6086..d70ddcdaa 100644
--- a/lib_rend/lib_rend.c
+++ b/lib_rend/lib_rend.c
@@ -81,6 +81,7 @@ typedef struct
 typedef struct
 {
     const int32_t *pOutSampleRate;
+    const int32_t *pMaxGlobalDelayNs;
     const AUDIO_CONFIG *pOutConfig;
     const LSSETUP_CUSTOM_STRUCT *pCustomLsOut;
     const EFAP_WRAPPER *pEfapOutWrapper;
@@ -97,9 +98,11 @@ typedef struct
     AUDIO_CONFIG inConfig;
     IVAS_REND_InputId id;
     IVAS_REND_AudioBuffer inputBuffer;
+    TD_RINGBUF_HANDLE delayBuffer;
     float gain; /* Linear, not in dB */
     rendering_context ctx;
     int32_t numNewSamplesPerChannel; /* Used to keep track how much new audio was fed before rendering current frame */
+    int32_t delayNumSamples;
 } input_base;
 
 typedef struct
@@ -192,6 +195,7 @@ typedef struct hrtf_handles
 struct IVAS_REND
 {
     int32_t sampleRateOut;
+    int32_t maxGlobalDelayNs;
 
     IVAS_LIMITER_HANDLE hLimiter;
 #ifdef DEBUGGING
@@ -207,11 +211,12 @@ struct IVAS_REND
     AUDIO_CONFIG outputConfig;
     EFAP_WRAPPER efapOutWrapper;
     IVAS_LSSETUP_CUSTOM_STRUCT customLsOut;
+
+    int16_t splitRendBFI;
     SPLIT_REND_WRAPPER *splitRendWrapper;
     IVAS_REND_AudioBuffer splitRendEncBuffer;
 
     IVAS_REND_HeadRotData headRotData;
-    int16_t splitRendBFI;
 
     EXTERNAL_ORIENTATION_HANDLE hExternalOrientationData;
     COMBINED_ORIENTATION_HANDLE hCombinedOrientationData;
@@ -262,6 +267,13 @@ static void freeInputBaseBufferData(
     return;
 }
 
+static int16_t latencyNsToSamples( /* converts a latency in nanoseconds to a number of samples, rounded to the nearest integer */
+    int32_t sampleRate, /* i  : sampling rate in samples per second */
+    int32_t latency_ns ) /* i  : latency in nanoseconds */
+{
+    return (int16_t) roundf( (float) ( latency_ns ) * ( sampleRate / 1000000000.f ) ); /* NOTE(review): narrowed to int16_t without a range check */
+}
+
 static ivas_error allocateMcLfeDelayBuffer(
     float **lfeDelayBuffer,
     const int16_t data_size )
@@ -369,7 +381,7 @@ static void copyBufferToCLDFBarray(
 static void accumulateCLDFBArrayToBuffer(
     float re[][CLDFB_NO_COL_MAX][CLDFB_NO_CHANNELS_MAX],
     float im[][CLDFB_NO_COL_MAX][CLDFB_NO_CHANNELS_MAX],
-    IVAS_REND_AudioBuffer *buffer )
+    const IVAS_REND_AudioBuffer *buffer )
 {
     uint32_t smplIdx, slotIdx;
     uint32_t numCldfbSamples, num_bands;
@@ -1165,6 +1177,8 @@ static void initRendInputBase(
     inputBase->gain = 1.0f;
     inputBase->ctx = rendCtx;
     inputBase->numNewSamplesPerChannel = 0;
+    inputBase->delayNumSamples = 0;
+    inputBase->delayBuffer = NULL;
 
     inputBase->inputBuffer.config.numSamplesPerChannel = 0;
     inputBase->inputBuffer.config.numChannels = 0;
@@ -1213,6 +1227,7 @@ static rendering_context getRendCtx(
     /* Note: when refactoring this, always take the ADDRESS of a member of the
      * renderer struct, so that the context stores a POINTER to the member, even
      * if the member is a pointer or handle itself. */
+    ctx.pMaxGlobalDelayNs = &hIvasRend->maxGlobalDelayNs;
     ctx.pOutConfig = &hIvasRend->outputConfig;
     ctx.pOutSampleRate = &hIvasRend->sampleRateOut;
     ctx.pCustomLsOut = &hIvasRend->customLsOut;
@@ -1255,6 +1270,272 @@ static bool isIoConfigPairSupported(
 }
 
 
+/* Returns the larger of the ISM input's TD renderer and (if allocated) Crend binaural latencies in ns; never negative */
+static int32_t getRendInputDelayIsm(
+    const input_ism *inputIsm,
+    bool splitPreRendCldfb )
+{
+    int32_t delayNs;
+    delayNs = 0;
+    (void) splitPreRendCldfb; /* not used for ISM inputs */
+    if ( inputIsm->tdRendWrapper.binaural_latency_ns > delayNs ) /* TD renderer latency */
+    {
+        delayNs = inputIsm->tdRendWrapper.binaural_latency_ns;
+    }
+    if ( inputIsm->crendWrapper != NULL && inputIsm->crendWrapper->binaural_latency_ns > delayNs ) /* Crend latency */
+    {
+        delayNs = inputIsm->crendWrapper->binaural_latency_ns;
+    }
+
+    return delayNs;
+}
+
+
+/* Stores the ISM input's rendering delay, converted to samples at the output sampling rate, in base.delayNumSamples */
+static void setRendInputDelayIsm(
+    void *input,
+    bool splitPreRendCldfb )
+{
+    input_ism *const pIsm = (input_ism *) input;
+    const int32_t delayNs = getRendInputDelayIsm( pIsm, splitPreRendCldfb );
+
+    pIsm->base.delayNumSamples = latencyNsToSamples( *pIsm->base.ctx.pOutSampleRate, delayNs );
+}
+
+
+/* Returns the larger of the MC input's TD renderer and (if allocated) Crend binaural latencies in ns; never negative */
+static int32_t getRendInputDelayMc(
+    const input_mc *inputMc,
+    bool splitPreRendCldfb )
+{
+    int32_t delayNs;
+    delayNs = 0;
+    (void) splitPreRendCldfb; /* not used for MC inputs */
+    if ( inputMc->tdRendWrapper.binaural_latency_ns > delayNs ) /* TD renderer latency */
+    {
+        delayNs = inputMc->tdRendWrapper.binaural_latency_ns;
+    }
+    if ( inputMc->crendWrapper != NULL && inputMc->crendWrapper->binaural_latency_ns > delayNs ) /* Crend latency */
+    {
+        delayNs = inputMc->crendWrapper->binaural_latency_ns;
+    }
+    return delayNs;
+}
+
+
+/* Stores the MC input's rendering delay, converted to samples at the output sampling rate, in base.delayNumSamples */
+static void setRendInputDelayMc(
+    void *input,
+    bool splitPreRendCldfb )
+{
+    input_mc *const pMc = (input_mc *) input;
+    const int32_t delayNs = getRendInputDelayMc( pMc, splitPreRendCldfb );
+
+    pMc->base.delayNumSamples = latencyNsToSamples( *pMc->base.ctx.pOutSampleRate, delayNs );
+}
+
+
+/* Returns the largest latency (ns) over the SBA input's allocated renderers (CLDFB renderer, Crend); 0 if none is allocated */
+static int32_t getRendInputDelaySba(
+    const input_sba *inputSba,
+    bool splitPreRendCldfb )
+{
+    int32_t delayNs, cldfbDelayNs;
+    delayNs = 0;
+
+    if ( inputSba->cldfbRendWrapper.hCldfbRend != NULL )
+    {
+        /* IVAS_FB_DEC_DELAY_NS is added on top unless splitPreRendCldfb is set */
+        cldfbDelayNs = inputSba->cldfbRendWrapper.binaural_latency_ns + ( splitPreRendCldfb ? 0 : IVAS_FB_DEC_DELAY_NS );
+        delayNs = ( cldfbDelayNs > delayNs ) ? cldfbDelayNs : delayNs;
+    }
+    if ( inputSba->crendWrapper != NULL && inputSba->crendWrapper->binaural_latency_ns > delayNs )
+    {
+        delayNs = inputSba->crendWrapper->binaural_latency_ns;
+    }
+
+    return delayNs;
+}
+
+
+/* Stores the SBA input's rendering delay, converted to samples at the output sampling rate, in base.delayNumSamples */
+static void setRendInputDelaySba(
+    void *input,
+    bool splitPreRendCldfb )
+{
+    input_sba *const pSba = (input_sba *) input;
+    const int32_t delayNs = getRendInputDelaySba( pSba, splitPreRendCldfb );
+
+    pSba->base.delayNumSamples = latencyNsToSamples( *pSba->base.ctx.pOutSampleRate, delayNs );
+}
+
+
+/* Latency (ns) of a MASA input: 0 for MASA1 to mono and for MASA output, otherwise IVAS_FB_DEC_DELAY_NS unless splitPreRendCldfb is set */
+static int32_t getRendInputDelayMasa(
+    const input_masa *inputMasa,
+    bool splitPreRendCldfb )
+{
+    int32_t delayNs;
+    const AUDIO_CONFIG outConfig = *inputMasa->base.ctx.pOutConfig;
+
+    /* these two configurations report no delay */
+    if ( inputMasa->base.inConfig == IVAS_AUDIO_CONFIG_MASA1 && outConfig == IVAS_AUDIO_CONFIG_MONO )
+    {
+        return 0;
+    }
+    if ( getAudioConfigType( outConfig ) == IVAS_REND_AUDIO_CONFIG_TYPE_MASA )
+    {
+        return 0;
+    }
+    /* no delay applied for split rendering */
+    delayNs = (int32_t) ( splitPreRendCldfb ? 0 : (float) IVAS_FB_DEC_DELAY_NS + 0.5f );
+    return ( delayNs > 0 ) ? delayNs : 0;
+}
+
+
+/* Stores the MASA input's rendering delay, converted to samples at the output sampling rate, in base.delayNumSamples */
+static void setRendInputDelayMasa(
+    void *input,
+    bool splitPreRendCldfb )
+{
+    input_masa *const pMasa = (input_masa *) input;
+    const int32_t delayNs = getRendInputDelayMasa( pMasa, splitPreRendCldfb );
+
+    pMasa->base.delayNumSamples = latencyNsToSamples( *pMasa->base.ctx.pOutSampleRate, delayNs );
+}
+
+
+/* Returns the largest rendering latency (ns) over all inputs whose inConfig is not IVAS_AUDIO_CONFIG_INVALID; 0 if there are none */
+static int32_t getMaxGlobalDelayNs( IVAS_REND_CONST_HANDLE hIvasRend )
+{
+    int16_t idx;
+    int32_t inputDelayNs;
+    int32_t globalDelayNs;
+    bool isLcldSplitRend;
+
+    globalDelayNs = 0;
+
+    /* assumes that an input has been added, which means the codec has been set to either LCLD or LC3plus
+     * (even if the render config specified default); without a renderer config the flag is false */
+    isLcldSplitRend = ( hIvasRend->hRendererConfig != NULL ) &&
+                      ( hIvasRend->hRendererConfig->split_rend_config.codec == ISAR_SPLIT_REND_CODEC_LCLD );
+
+    for ( idx = 0; idx < RENDERER_MAX_ISM_INPUTS; idx++ )
+    {
+        if ( hIvasRend->inputsIsm[idx].base.inConfig == IVAS_AUDIO_CONFIG_INVALID )
+        {
+            continue; /* slot holds no ISM input */
+        }
+        inputDelayNs = getRendInputDelayIsm( &hIvasRend->inputsIsm[idx], isLcldSplitRend );
+        globalDelayNs = ( inputDelayNs > globalDelayNs ) ? inputDelayNs : globalDelayNs;
+    }
+
+    for ( idx = 0; idx < RENDERER_MAX_MC_INPUTS; idx++ )
+    {
+        if ( hIvasRend->inputsMc[idx].base.inConfig == IVAS_AUDIO_CONFIG_INVALID )
+        {
+            continue; /* slot holds no MC input */
+        }
+        inputDelayNs = getRendInputDelayMc( &hIvasRend->inputsMc[idx], isLcldSplitRend );
+        globalDelayNs = ( inputDelayNs > globalDelayNs ) ? inputDelayNs : globalDelayNs;
+    }
+
+    for ( idx = 0; idx < RENDERER_MAX_SBA_INPUTS; idx++ )
+    {
+        if ( hIvasRend->inputsSba[idx].base.inConfig == IVAS_AUDIO_CONFIG_INVALID )
+        {
+            continue; /* slot holds no SBA input */
+        }
+        inputDelayNs = getRendInputDelaySba( &hIvasRend->inputsSba[idx], isLcldSplitRend );
+        globalDelayNs = ( inputDelayNs > globalDelayNs ) ? inputDelayNs : globalDelayNs;
+    }
+
+    for ( idx = 0; idx < RENDERER_MAX_MASA_INPUTS; idx++ )
+    {
+        if ( hIvasRend->inputsMasa[idx].base.inConfig == IVAS_AUDIO_CONFIG_INVALID )
+        {
+            continue; /* slot holds no MASA input */
+        }
+        inputDelayNs = getRendInputDelayMasa( &hIvasRend->inputsMasa[idx], isLcldSplitRend );
+        globalDelayNs = ( inputDelayNs > globalDelayNs ) ? inputDelayNs : globalDelayNs;
+    }
+
+    return globalDelayNs;
+}
+
+
+static void setMaxGlobalDelayNs( IVAS_REND_HANDLE hIvasRend ) /* stores the result of getMaxGlobalDelayNs() in hIvasRend->maxGlobalDelayNs */
+{
+    hIvasRend->maxGlobalDelayNs = getMaxGlobalDelayNs( (IVAS_REND_CONST_HANDLE) hIvasRend );
+}
+
+/* Aligns one input to the renderer-wide maximum delay: on first use, a ring buffer pre-filled with
+ * (maximum delay - own delay) zeros is opened; each call then pushes the new frame and pops a delayed one.
+ * With flushInputs set nothing is pushed and ivas_TD_RINGBUF_Size() samples are popped (NOTE(review): confirm
+ * inputBuffer can hold them). Returns IVAS_ERR_OK or the error reported by ivas_TD_RINGBUF_Open(). */
+static ivas_error alignInputDelay(
+    input_base *inputBase,
+    const IVAS_REND_ReadOnlyAudioBuffer inputAudio,
+    const int32_t maxGlobalDelayNs,
+    const int32_t sampleRateOut,
+    const int16_t cldfb2tdSampleFact,
+    const bool flushInputs )
+{
+    ivas_error error;
+    input_ism *inputIsm;
+    int32_t maxGlobalDelaySamples, preDelay; /* signed and 32 bit wide: must neither wrap nor truncate */
+    uint32_t ringBufferSize, numSamplesToPush, numSamplesToPop;
+
+    maxGlobalDelaySamples = (int32_t) latencyNsToSamples( sampleRateOut, maxGlobalDelayNs ) * cldfb2tdSampleFact;
+
+    /* check if we need to open the delay buffer */
+    if ( inputBase->delayBuffer == NULL )
+    {
+        /* pre delay for this input is maximum delay - input delay; a negative difference must not wrap to a huge count */
+        preDelay = maxGlobalDelaySamples - inputBase->delayNumSamples * cldfb2tdSampleFact;
+
+        if ( preDelay > 0 )
+        {
+            /* buffer has to accommodate maxGlobalDelaySamples + 2 * frameSize */
+            ringBufferSize = (uint32_t) ( maxGlobalDelaySamples + 2 * inputAudio.config.numSamplesPerChannel );
+
+            if ( ( error = ivas_TD_RINGBUF_Open( &inputBase->delayBuffer, ringBufferSize, inputAudio.config.numChannels ) ) != IVAS_ERR_OK )
+            {
+                return error;
+            }
+
+            /* for the first frame we need to push zeros to align the input delay to the global delay
+             * and then push a frame of actual data */
+            ivas_TD_RINGBUF_PushZeros( inputBase->delayBuffer, (uint32_t) preDelay );
+
+            /* for ISM inputs, ensure the metadata sync delay is updated */
+            if ( getAudioConfigType( inputBase->inConfig ) == IVAS_REND_AUDIO_CONFIG_TYPE_OBJECT_BASED )
+            {
+                inputIsm = (input_ism *) inputBase;
+                inputIsm->ism_metadata_delay_ms = maxGlobalDelayNs / 1e6f;
+            }
+        }
+    }
+
+    if ( inputBase->delayBuffer != NULL )
+    {
+        /* push in the new input data and pop to retrieve a complete input frame
+         * if we are flushing the inputs, we don't push in any new data */
+        numSamplesToPush = flushInputs ? 0 : (uint32_t) inputAudio.config.numSamplesPerChannel;
+        numSamplesToPop = flushInputs ? ivas_TD_RINGBUF_Size( inputBase->delayBuffer ) : (uint32_t) inputAudio.config.numSamplesPerChannel;
+
+        ivas_TD_RINGBUF_Push( inputBase->delayBuffer, inputAudio.data, numSamplesToPush );
+        ivas_TD_RINGBUF_Pop( inputBase->delayBuffer, inputBase->inputBuffer.data, numSamplesToPop );
+    }
+    else
+    {
+        /* delay buffer isn't open - we don't need it */
+        mvr2r( inputAudio.data, inputBase->inputBuffer.data, inputAudio.config.numSamplesPerChannel * inputAudio.config.numChannels );
+    }
+
+    return IVAS_ERR_OK;
+}
+
 static ivas_error initIsmMasaRendering(
     input_ism *inputIsm,
     const int32_t inSampleRate )
@@ -1409,6 +1690,8 @@ static void clearInputIsm(
     rendCtx = inputIsm->base.ctx;
 
     freeInputBaseBufferData( &inputIsm->base.inputBuffer.data );
+    ivas_TD_RINGBUF_Close( &inputIsm->base.delayBuffer );
+
     initRendInputBase( &inputIsm->base, IVAS_AUDIO_CONFIG_INVALID, 0, rendCtx, NULL, 0 );
 
     /* Free input's internal handles */
@@ -2200,7 +2483,7 @@ static ivas_error initMcBinauralRendering(
 
     /* determine binaural delay ( used for aligning LFE to output signal ) */
     binauralDelayNs = max( ( inputMc->crendWrapper != NULL ) ? inputMc->crendWrapper->binaural_latency_ns : 0, inputMc->tdRendWrapper.binaural_latency_ns );
-    inputMc->binauralDelaySmp = (int16_t) roundf( (float) binauralDelayNs * *inputMc->base.ctx.pOutSampleRate / 1000000000.f );
+    inputMc->binauralDelaySmp = latencyNsToSamples( *inputMc->base.ctx.pOutSampleRate, binauralDelayNs );
 
     if ( inputMc->binauralDelaySmp > MAX_BIN_DELAY_SAMPLES )
     {
@@ -2403,6 +2686,8 @@ static void clearInputMc(
 
     freeMcLfeDelayBuffer( &inputMc->lfeDelayBuffer );
     freeInputBaseBufferData( &inputMc->bufferData );
+    ivas_TD_RINGBUF_Close( &inputMc->base.delayBuffer );
+
     initRendInputBase( &inputMc->base, IVAS_AUDIO_CONFIG_INVALID, 0, rendCtx, NULL, 0 );
 
     /* Free input's internal handles */
@@ -2726,7 +3011,7 @@ static ivas_error setRendInputActiveSba(
         return error;
     }
 
-    return error;
+    return IVAS_ERR_OK;
 }
 
 
@@ -2738,6 +3023,7 @@ static void clearInputSba(
     rendCtx = inputSba->base.ctx;
 
     freeInputBaseBufferData( &inputSba->bufferData );
+    ivas_TD_RINGBUF_Close( &inputSba->base.delayBuffer );
 
     initRendInputBase( &inputSba->base, IVAS_AUDIO_CONFIG_INVALID, 0, rendCtx, NULL, 0 );
 
@@ -2822,6 +3108,7 @@ static void clearInputMasa(
     rendCtx = inputMasa->base.ctx;
 
     freeInputBaseBufferData( &inputMasa->bufferData );
+    ivas_TD_RINGBUF_Close( &inputMasa->base.delayBuffer );
 
     masaPrerendClose( &inputMasa->hMasaPrerend );
     freeMasaExtRenderer( &inputMasa->hMasaExtRend );
@@ -2890,7 +3177,7 @@ ivas_error IVAS_REND_Open(
     hIvasRend->num_subframes = num_subframes;
 
     /* Initialize limiter */
-    if ( ( error = IVAS_REND_NumOutChannels( hIvasRend, &numOutChannels ) ) != IVAS_ERR_OK )
+    if ( ( error = IVAS_REND_GetNumOutChannels( hIvasRend, &numOutChannels ) ) != IVAS_ERR_OK )
     {
         return error;
     }
@@ -2947,6 +3234,10 @@ ivas_error IVAS_REND_Open(
 
         isar_init_split_rend_handles( hIvasRend->splitRendWrapper );
     }
+    hIvasRend->splitRendEncBuffer.data = NULL;
+    hIvasRend->splitRendEncBuffer.config.is_cldfb = 0;
+    hIvasRend->splitRendEncBuffer.config.numChannels = 0;
+    hIvasRend->splitRendEncBuffer.config.numSamplesPerChannel = 0;
 
     for ( i = 0; i < RENDERER_MAX_ISM_INPUTS; ++i )
     {
@@ -3142,7 +3433,7 @@ ivas_error IVAS_REND_ConfigureCustomOutputLoudspeakerLayout(
     hIvasRend->customLsOut = makeCustomLsSetup( layout );
 
     /* Re-initialize limiter - number of output channels may have changed */
-    if ( ( error = IVAS_REND_NumOutChannels( hIvasRend, &numOutChannels ) ) != IVAS_ERR_OK )
+    if ( ( error = IVAS_REND_GetNumOutChannels( hIvasRend, &numOutChannels ) ) != IVAS_ERR_OK )
     {
         return error;
     }
@@ -3199,12 +3490,12 @@ ivas_error IVAS_REND_ConfigureCustomOutputLoudspeakerLayout(
 
 
 /*-------------------------------------------------------------------*
- * IVAS_REND_NumOutChannels()
+ * IVAS_REND_GetNumOutChannels()
  *
  *
  *-------------------------------------------------------------------*/
 
-ivas_error IVAS_REND_NumOutChannels(
+ivas_error IVAS_REND_GetNumOutChannels(
     IVAS_REND_CONST_HANDLE hIvasRend,
     int16_t *numOutChannels )
 {
@@ -3422,10 +3713,15 @@ static int16_t getCldfbRendFlag(
     const IVAS_REND_AudioConfigType new_configType )
 {
     int16_t i;
-    int16_t numMasaInputs = 0, numSbaInputs = 0, numIsmInputs = 0, numMcInputs = 0;
+    int16_t numMasaInputs = 0, numSbaInputs = 0;
     int16_t isCldfbRend;
 
     isCldfbRend = 0;
+    /* This function is called during three different phases of renderer processing:
+     * - IVAS_REND_AddInput()
+     * - IVAS_REND_FeedRenderConfig()
+     * - IVAS_REND_GetSplitBinauralBitstream()
+     * Only the last case can assume all inputs are present for the current frame to be rendered */
     if ( hIvasRend->hRendererConfig != NULL )
     {
         for ( i = 0; i < RENDERER_MAX_MASA_INPUTS; ++i )
@@ -3436,24 +3732,8 @@ static int16_t getCldfbRendFlag(
         {
             numSbaInputs += ( hIvasRend->inputsSba[i].base.inConfig == IVAS_AUDIO_CONFIG_INVALID && new_configType != IVAS_REND_AUDIO_CONFIG_TYPE_AMBISONICS ) ? 0 : 1;
         }
-        for ( i = 0; i < RENDERER_MAX_ISM_INPUTS; ++i )
-        {
-            numIsmInputs += ( hIvasRend->inputsIsm[i].base.inConfig == IVAS_AUDIO_CONFIG_INVALID && new_configType != IVAS_REND_AUDIO_CONFIG_TYPE_OBJECT_BASED ) ? 0 : 1;
-        }
-        for ( i = 0; i < RENDERER_MAX_MC_INPUTS; ++i )
-        {
-            numMcInputs += ( hIvasRend->inputsMc[i].base.inConfig == IVAS_AUDIO_CONFIG_INVALID && new_configType != IVAS_REND_AUDIO_CONFIG_TYPE_CHANNEL_BASED ) ? 0 : 1;
-        }
 
-        if ( numIsmInputs > 0 || numMcInputs > 0 )
-        {
-            isCldfbRend = 0;
-        }
-#ifdef FIX_HRTF_LOAD
-        else if ( ( numMasaInputs > 0 ) || ( numSbaInputs > 0 && hIvasRend->hRendererConfig->split_rend_config.rendererSelection == IVAS_BIN_RENDERER_TYPE_FASTCONV ) )
-#else
-        else if ( ( numMasaInputs > 0 ) || ( numSbaInputs > 0 && hIvasRend->hRendererConfig->split_rend_config.rendererSelection == ISAR_SPLIT_REND_RENDERER_SELECTION_FASTCONV ) )
-#endif
+        if ( ( numMasaInputs > 0 ) || ( numSbaInputs > 0 && hIvasRend->hRendererConfig->split_rend_config.rendererSelection == IVAS_BIN_RENDERER_TYPE_FASTCONV ) )
         {
             isCldfbRend = 1;
         }
@@ -3463,12 +3743,12 @@ static int16_t getCldfbRendFlag(
 }
 
 /*-------------------------------------------------------------------------
- * Function ivas_pre_rend_init()
+ * Function isar_pre_rend_init()
  *
  *
  *------------------------------------------------------------------------*/
 
-static ivas_error ivas_pre_rend_init(
+static ivas_error isar_pre_rend_init(
     SPLIT_REND_WRAPPER *pSplitRendWrapper,
     IVAS_REND_AudioBuffer *pSplitRendEncBuffer,
     ISAR_SPLIT_REND_CONFIG_DATA *pSplit_rend_config,
@@ -3478,10 +3758,20 @@ static ivas_error ivas_pre_rend_init(
     const int16_t cldfb_in_flag,
     const int16_t num_subframes )
 {
+    bool resizeBuffer; /* true when an already allocated encoder buffer must be re-allocated */
     ivas_error error;
     IVAS_REND_AudioBufferConfig bufConfig;
 
-    if ( outConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_CODED || outConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM )
+    resizeBuffer = false;
+
+    /* only perform init if split rendering output */
+    if ( outConfig != IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_CODED && outConfig != IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM )
+    {
+        return IVAS_ERR_OK;
+    }
+
+    /* these functions should only be called once during initial allocation */
+    if ( pSplitRendEncBuffer->data == NULL )
     {
         if ( pSplit_rend_config->poseCorrectionMode == ISAR_SPLIT_REND_POSE_CORRECTION_MODE_CLDFB )
         {
@@ -3496,28 +3786,34 @@ static ivas_error ivas_pre_rend_init(
         {
             return error;
         }
+    }
+
+    /* We may need to change the allocated buffer size if a new input is added.
+     * If the cldfb_in_flag is different from what was previously allocated for the buffer, change the size */
+    if ( pSplitRendEncBuffer->data != NULL && ( cldfb_in_flag != pSplitRendEncBuffer->config.is_cldfb ) )
+    {
+        resizeBuffer = true;
+    }
 
-        /*allocate for CLDFB in and change to TD during process if needed*/
-        bufConfig.numSamplesPerChannel = MAX_CLDFB_BUFFER_LENGTH_PER_CHANNEL;
+    if ( pSplitRendEncBuffer->data == NULL || resizeBuffer )
+    {
+        /* set buffer config: per-channel length depends on whether the buffer holds CLDFB or time-domain data */
+        bufConfig.is_cldfb = cldfb_in_flag;
+        bufConfig.numSamplesPerChannel = cldfb_in_flag ? MAX_CLDFB_BUFFER_LENGTH_PER_CHANNEL : L_FRAME_MAX;
         bufConfig.numChannels = BINAURAL_CHANNELS * pSplitRendWrapper->multiBinPoseData.num_poses;
-        bufConfig.is_cldfb = 1;
         pSplitRendEncBuffer->config = bufConfig;
 
+        /* allocate memory; when resizing, release the previously allocated buffer first */
+        if ( resizeBuffer )
+        {
+            free( pSplitRendEncBuffer->data );
+        }
+
         if ( ( pSplitRendEncBuffer->data = malloc( bufConfig.numChannels * bufConfig.numSamplesPerChannel * sizeof( float ) ) ) == NULL )
         {
             return IVAS_ERR_FAILED_ALLOC;
         }
     }
-    else
-    {
-        IVAS_REND_AudioBufferConfig bufConfig2;
-
-        bufConfig2.numSamplesPerChannel = 0;
-        bufConfig2.numChannels = 0;
-        bufConfig2.is_cldfb = 0;
-        pSplitRendEncBuffer->config = bufConfig2;
-        pSplitRendEncBuffer->data = NULL;
-    }
 
     return IVAS_ERR_OK;
 }
@@ -3540,7 +3836,10 @@ ivas_error IVAS_REND_AddInput(
     void *inputsArray;
     int32_t inputStructSize;
     ivas_error ( *activateInput )( void *, AUDIO_CONFIG, IVAS_REND_InputId, RENDER_CONFIG_DATA *, hrtf_handles *hrtfs );
+    void ( *setInputDelay )( void *, bool );
     int32_t inputIndex;
+    bool splitPreRendCldfb;
+    splitPreRendCldfb = false;
 
     /* Validate function arguments */
     if ( hIvasRend == NULL || inputId == NULL )
@@ -3548,15 +3847,24 @@ ivas_error IVAS_REND_AddInput(
         return IVAS_ERR_UNEXPECTED_NULL_POINTER;
     }
 
-    if ( ( hIvasRend->outputConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_CODED || hIvasRend->outputConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM ) && hIvasRend->splitRendEncBuffer.data == NULL && hIvasRend->hRendererConfig != NULL )
+    if ( hIvasRend->hRendererConfig != NULL )
     {
         int16_t cldfb_in_flag;
         cldfb_in_flag = getCldfbRendFlag( hIvasRend, getAudioConfigType( inConfig ) );
 
-        if ( ( error = ivas_pre_rend_init( hIvasRend->splitRendWrapper, &hIvasRend->splitRendEncBuffer, &hIvasRend->hRendererConfig->split_rend_config, hIvasRend->headRotData, hIvasRend->sampleRateOut, hIvasRend->outputConfig, cldfb_in_flag, hIvasRend->num_subframes ) ) != IVAS_ERR_OK )
+        if ( ( error = isar_pre_rend_init( hIvasRend->splitRendWrapper,
+                                           &hIvasRend->splitRendEncBuffer,
+                                           &hIvasRend->hRendererConfig->split_rend_config,
+                                           hIvasRend->headRotData,
+                                           hIvasRend->sampleRateOut,
+                                           hIvasRend->outputConfig,
+                                           cldfb_in_flag,
+                                           hIvasRend->num_subframes ) ) != IVAS_ERR_OK )
         {
             return error;
         }
+        /* Assumes that an input has been added, which means the codec has been set to either LCLD or LC3plus (even if the render config specified the default) */
+        splitPreRendCldfb = ( hIvasRend->hRendererConfig->split_rend_config.codec == ISAR_SPLIT_REND_CODEC_LCLD );
     }
 
     switch ( getAudioConfigType( inConfig ) )
@@ -3566,24 +3874,28 @@ ivas_error IVAS_REND_AddInput(
             inputsArray = hIvasRend->inputsIsm;
             inputStructSize = sizeof( *hIvasRend->inputsIsm );
             activateInput = setRendInputActiveIsm;
+            setInputDelay = setRendInputDelayIsm;
             break;
         case IVAS_REND_AUDIO_CONFIG_TYPE_CHANNEL_BASED:
             maxNumInputsOfType = RENDERER_MAX_MC_INPUTS;
             inputsArray = hIvasRend->inputsMc;
             inputStructSize = sizeof( *hIvasRend->inputsMc );
             activateInput = setRendInputActiveMc;
+            setInputDelay = setRendInputDelayMc;
             break;
         case IVAS_REND_AUDIO_CONFIG_TYPE_AMBISONICS:
             maxNumInputsOfType = RENDERER_MAX_SBA_INPUTS;
             inputsArray = hIvasRend->inputsSba;
             inputStructSize = sizeof( *hIvasRend->inputsSba );
             activateInput = setRendInputActiveSba;
+            setInputDelay = setRendInputDelaySba;
             break;
         case IVAS_REND_AUDIO_CONFIG_TYPE_MASA:
             maxNumInputsOfType = RENDERER_MAX_MASA_INPUTS;
             inputsArray = hIvasRend->inputsMasa;
             inputStructSize = sizeof( *hIvasRend->inputsMasa );
             activateInput = setRendInputActiveMasa;
+            setInputDelay = setRendInputDelayMasa;
             break;
         default:
             return IVAS_ERR_INVALID_INPUT_FORMAT;
@@ -3600,6 +3912,14 @@ ivas_error IVAS_REND_AddInput(
     {
         return error;
     }
+#ifdef CODE_IMPROVEMENTS
+    setInputDelay( getInputByIndex( inputsArray, inputIndex, inputType ), splitPreRendCldfb );
+#else
+    setInputDelay( (uint8_t *) inputsArray + inputStructSize * inputIndex, splitPreRendCldfb );
+#endif
+
+    /* set global maximum delay after adding an input */
+    setMaxGlobalDelayNs( hIvasRend );
 
     return IVAS_ERR_OK;
 }
@@ -3882,6 +4202,9 @@ ivas_error IVAS_REND_RemoveInput(
             return IVAS_ERR_INVALID_INPUT_FORMAT;
     }
 
+    /* set global maximum delay after removing an input */
+    setMaxGlobalDelayNs( hIvasRend );
+
     return IVAS_ERR_OK;
 }
 
@@ -3958,11 +4281,6 @@ ivas_error IVAS_REND_GetDelay(
     int32_t *timeScale                /* o  : Time scale of the delay, equal to renderer output sampling rate   */
 )
 {
-    /* TODO tmu : this function only returns the maximum delay across all inputs
-     * Ideally each input has its own delay buffer and everything is aligned (binaural and LFE filtering delays are nonuniform)
-     */
-    int16_t i;
-    int32_t latency_ns;
     int32_t max_latency_ns;
 
     /* Validate function arguments */
@@ -3971,75 +4289,11 @@ ivas_error IVAS_REND_GetDelay(
         return IVAS_ERR_UNEXPECTED_NULL_POINTER;
     }
 
-    *timeScale = hIvasRend->sampleRateOut;
     *nSamples = 0;
-    max_latency_ns = 0;
-
-    /* Compute the maximum delay across all inputs */
-    for ( i = 0; i < RENDERER_MAX_ISM_INPUTS; i++ )
-    {
-        if ( hIvasRend->inputsIsm[i].base.inConfig != IVAS_AUDIO_CONFIG_INVALID )
-        {
-            latency_ns = max( ( hIvasRend->inputsIsm[i].crendWrapper != NULL ) ? hIvasRend->inputsIsm[i].crendWrapper->binaural_latency_ns : 0,
-                              hIvasRend->inputsIsm[i].tdRendWrapper.binaural_latency_ns );
-            max_latency_ns = max( max_latency_ns, latency_ns );
-        }
-    }
-
-    for ( i = 0; i < RENDERER_MAX_MC_INPUTS; i++ )
-    {
-        if ( hIvasRend->inputsMc[i].base.inConfig != IVAS_AUDIO_CONFIG_INVALID )
-        {
-            latency_ns = max( ( hIvasRend->inputsMc[i].crendWrapper != NULL ) ? hIvasRend->inputsMc[i].crendWrapper->binaural_latency_ns : 0,
-                              hIvasRend->inputsMc[i].tdRendWrapper.binaural_latency_ns );
-            max_latency_ns = max( max_latency_ns, latency_ns );
-        }
-    }
-
-    for ( i = 0; i < RENDERER_MAX_SBA_INPUTS; i++ )
-    {
-        if ( hIvasRend->inputsSba[i].base.inConfig != IVAS_AUDIO_CONFIG_INVALID )
-        {
-            if ( hIvasRend->splitRendWrapper != NULL && hIvasRend->splitRendWrapper->hBinHrSplitPreRend != NULL )
-            {
-#ifdef FIX_HRTF_LOAD
-                if ( hIvasRend->hRendererConfig->split_rend_config.rendererSelection == IVAS_BIN_RENDERER_TYPE_FASTCONV )
-#else
-                if ( hIvasRend->hRendererConfig->split_rend_config.rendererSelection == ISAR_SPLIT_REND_RENDERER_SELECTION_FASTCONV )
-#endif
-                {
-                    latency_ns = hIvasRend->inputsSba[i].cldfbRendWrapper.binaural_latency_ns;
-                }
-                else
-                {
-                    latency_ns = ( hIvasRend->inputsSba[i].crendWrapper != NULL ) ? hIvasRend->inputsSba[i].crendWrapper->binaural_latency_ns : 0;
-                }
-                max_latency_ns = max( max_latency_ns, latency_ns );
-            }
-            else if ( hIvasRend->inputsSba[i].cldfbRendWrapper.hCldfbRend != NULL )
-            {
-                latency_ns = hIvasRend->inputsSba[i].cldfbRendWrapper.binaural_latency_ns;
-                latency_ns += IVAS_FB_DEC_DELAY_NS;
-                max_latency_ns = max( max_latency_ns, latency_ns );
-            }
-            else
-            {
-                latency_ns = ( hIvasRend->inputsSba[i].crendWrapper != NULL ) ? hIvasRend->inputsSba[i].crendWrapper->binaural_latency_ns : 0;
-                max_latency_ns = max( max_latency_ns, latency_ns );
-            }
-        }
-    }
-
-    for ( i = 0; i < RENDERER_MAX_MASA_INPUTS; i++ )
-    {
-        if ( hIvasRend->inputsMasa[i].base.inConfig != IVAS_AUDIO_CONFIG_INVALID )
-        {
-            latency_ns = (int32_t) ( (float) IVAS_FB_DEC_DELAY_NS + 0.5f );
-            max_latency_ns = max( max_latency_ns, latency_ns );
-        }
-    }
+    *timeScale = hIvasRend->sampleRateOut;
+    max_latency_ns = getMaxGlobalDelayNs( hIvasRend );
 
-    *nSamples = (int16_t) roundf( (float) max_latency_ns * *timeScale / 1000000000.f );
+    *nSamples = latencyNsToSamples( hIvasRend->sampleRateOut, max_latency_ns );
 
     return IVAS_ERR_OK;
 }
@@ -4052,9 +4306,10 @@ ivas_error IVAS_REND_GetDelay(
  *-------------------------------------------------------------------*/
 
 ivas_error IVAS_REND_FeedInputAudio(
-    IVAS_REND_HANDLE hIvasRend,                    /* i/o: Renderer handle          */
-    const IVAS_REND_InputId inputId,               /* i  : ID of the input          */
-    const IVAS_REND_ReadOnlyAudioBuffer inputAudio /* i  : buffer with input audio  */
+    IVAS_REND_HANDLE hIvasRend,                     /* i/o: Renderer handle          */
+    const IVAS_REND_InputId inputId,                /* i  : ID of the input          */
+    const IVAS_REND_ReadOnlyAudioBuffer inputAudio, /* i  : buffer with input audio  */
+    const bool flushInputs                          /* i  : flush input audio        */
 )
 {
     ivas_error error;
@@ -4110,9 +4365,16 @@ ivas_error IVAS_REND_FeedInputAudio(
     }
 
     inputBase->inputBuffer.config = inputAudio.config;
-
-    mvr2r( inputAudio.data, inputBase->inputBuffer.data, inputAudio.config.numSamplesPerChannel * inputAudio.config.numChannels );
-
+    if ( ( error = alignInputDelay(
+               inputBase,
+               inputAudio,
+               hIvasRend->maxGlobalDelayNs,
+               hIvasRend->sampleRateOut,
+               cldfb2tdSampleFact,
+               flushInputs ) ) != IVAS_ERR_OK )
+    {
+        return error;
+    }
     inputBase->numNewSamplesPerChannel = inputAudio.config.numSamplesPerChannel / cldfb2tdSampleFact;
 
     return IVAS_ERR_OK;
@@ -4433,6 +4695,7 @@ int16_t IVAS_REND_FeedRenderConfig(
             if ( pMasaInput->hMasaExtRend->hDiracDecBin[0] != NULL && pMasaInput->hMasaExtRend->hDiracDecBin[0]->hReverb != NULL )
             {
                 ivas_binaural_reverb_close( &pMasaInput->hMasaExtRend->hDiracDecBin[0]->hReverb );
+
                 if ( ( error = ivas_binaural_reverb_init( &pMasaInput->hMasaExtRend->hDiracDecBin[0]->hReverb, // Todo 1892
                                                           hIvasRend->hHrtfs.hHrtfStatistics,
                                                           pMasaInput->hMasaExtRend->hSpatParamRendCom->num_freq_bands,
@@ -4449,6 +4712,7 @@ int16_t IVAS_REND_FeedRenderConfig(
             if ( pMasaInput->hMasaExtRend->hReverb != NULL )
             {
                 ivas_binaural_reverb_close( &pMasaInput->hMasaExtRend->hReverb );
+
                 if ( ( error = ivas_binaural_reverb_init( &pMasaInput->hMasaExtRend->hReverb, // Todo 1892
                                                           hIvasRend->hHrtfs.hHrtfStatistics,
                                                           pMasaInput->hMasaExtRend->hSpatParamRendCom->num_freq_bands,
@@ -4481,6 +4745,7 @@ int16_t IVAS_REND_FeedRenderConfig(
                 return error;
             }
         }
+
         if ( pMcInput->crendWrapper != NULL && pMcInput->crendWrapper->hCrend[0] != NULL && pMcInput->crendWrapper->hCrend[0]->hReverb != NULL )
         {
             if ( ( error = ivas_reverb_open( &pMcInput->crendWrapper->hCrend[0]->hReverb, hIvasRend->hHrtfs.hHrtfStatistics, hRenderConfig, *pMcInput->base.ctx.pOutSampleRate ) ) != IVAS_ERR_OK )
@@ -4531,6 +4796,7 @@ int16_t IVAS_REND_FeedRenderConfig(
     {
         int16_t cldfb_in_flag;
         cldfb_in_flag = getCldfbRendFlag( hIvasRend, IVAS_REND_AUDIO_CONFIG_TYPE_UNKNOWN );
+
         if ( hIvasRend->splitRendWrapper != NULL )
         {
             ISAR_PRE_REND_close( hIvasRend->splitRendWrapper, &hIvasRend->splitRendEncBuffer );
@@ -4538,7 +4804,7 @@ int16_t IVAS_REND_FeedRenderConfig(
             hIvasRend->splitRendWrapper = NULL;
         }
 
-        if ( ( error = ivas_pre_rend_init( hIvasRend->splitRendWrapper, &hIvasRend->splitRendEncBuffer, &hIvasRend->hRendererConfig->split_rend_config, hIvasRend->headRotData, hIvasRend->sampleRateOut, hIvasRend->outputConfig, cldfb_in_flag, hIvasRend->num_subframes ) ) != IVAS_ERR_OK )
+        if ( ( error = isar_pre_rend_init( hIvasRend->splitRendWrapper, &hIvasRend->splitRendEncBuffer, &hIvasRend->hRendererConfig->split_rend_config, hIvasRend->headRotData, hIvasRend->sampleRateOut, hIvasRend->outputConfig, cldfb_in_flag, hIvasRend->num_subframes ) ) != IVAS_ERR_OK )
         {
             return error;
         }
@@ -5268,7 +5534,7 @@ static ivas_error renderIsmToBinaural(
 
     push_wmops( "renderIsmToBinaural" );
     /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
-    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000 / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
+    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
     copyBufferTo2dArray( ismInput->base.inputBuffer, tmpTDRendBuffer );
 
     if ( ( error = ivas_td_binaural_renderer_ext( &ismInput->tdRendWrapper, ismInput->base.inConfig, NULL, ismInput->base.ctx.pCombinedOrientationData, &ismInput->currentPos, ismInput->hReverb, ism_md_subframe_update_ext,
@@ -5471,7 +5737,7 @@ static ivas_error renderIsmToBinauralReverb(
     push_wmops( "renderIsmToBinauralRoom" );
 
     /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
-    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000 / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
+    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
 
     copyBufferTo2dArray( ismInput->base.inputBuffer, tmpRendBuffer );
 
@@ -5637,8 +5903,10 @@ static ivas_error renderIsmToSplitBinaural(
     const MULTI_BIN_REND_POSE_DATA *pMultiBinPoseData;
     const SPLIT_REND_WRAPPER *pSplitRendWrapper;
     IVAS_QUATERNION originalHeadRot[MAX_PARAM_SPATIAL_SUBFRAMES];
-    int16_t i;
+    int16_t i, ch, slot_idx, num_bands;
     float tmpBinaural[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS][L_FRAME48k];
+    float tmpBinaural_CldfbRe[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS][CLDFB_NO_COL_MAX][CLDFB_NO_CHANNELS_MAX];
+    float tmpBinaural_CldfbIm[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS][CLDFB_NO_COL_MAX][CLDFB_NO_CHANNELS_MAX];
     int16_t output_frame = ismInput->base.inputBuffer.config.numSamplesPerChannel;
     COMBINED_ORIENTATION_HANDLE pCombinedOrientationData;
     int16_t ism_md_subframe_update_ext;
@@ -5649,7 +5917,7 @@ static ivas_error renderIsmToSplitBinaural(
     pMultiBinPoseData = &pSplitRendWrapper->multiBinPoseData;
 
     /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
-    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000 / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
+    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
 
     pCombinedOrientationData = *ismInput->base.ctx.pCombinedOrientationData;
 
@@ -5705,10 +5973,29 @@ static ivas_error renderIsmToSplitBinaural(
             return error;
         }
 
-        /* Copy rendered audio to tmp storage buffer. Copying directly to output would
-         * overwrite original audio, which is still needed for rendering next head pose. */
-        mvr2r( tmpProcessing[0], tmpBinaural[2 * pos_idx], output_frame );
-        mvr2r( tmpProcessing[1], tmpBinaural[2 * pos_idx + 1], output_frame );
+        if ( outAudio.config.is_cldfb )
+        {
+            /* Perform CLDFB analysis on rendered audio, since the output buffer is CLDFB domain. Each pose/channel pair uses its own analysis filterbank, indexed like tmpBinaural_Cldfb*. NOTE(review): assumes cldfbAna holds one handle per pose and binaural channel - confirm */
+            num_bands = (int16_t) ( ( BINAURAL_MAXBANDS * *ismInput->base.ctx.pOutSampleRate ) / 48000 );
+            for ( ch = 0; ch < BINAURAL_CHANNELS; ch++ )
+            {
+                for ( slot_idx = 0; slot_idx < IVAS_CLDFB_NO_COL_MAX; slot_idx++ )
+                {
+                    cldfbAnalysis_ts( &tmpProcessing[ch][num_bands * slot_idx],
+                                      &tmpBinaural_CldfbRe[BINAURAL_CHANNELS * pos_idx + ch][slot_idx][0],
+                                      &tmpBinaural_CldfbIm[BINAURAL_CHANNELS * pos_idx + ch][slot_idx][0],
+                                      num_bands,
+                                      ismInput->base.ctx.pSplitRendWrapper->hCldfbHandles->cldfbAna[BINAURAL_CHANNELS * pos_idx + ch] );
+                }
+            }
+        }
+        else
+        {
+            /* Copy rendered audio to tmp storage buffer. Copying directly to output would
+             * overwrite original audio, which is still needed for rendering next head pose. */
+            mvr2r( tmpProcessing[0], tmpBinaural[BINAURAL_CHANNELS * pos_idx], output_frame );
+            mvr2r( tmpProcessing[1], tmpBinaural[BINAURAL_CHANNELS * pos_idx + 1], output_frame );
+        }
 
         /* Overwrite processing buffer with original input audio again */
         copyBufferTo2dArray( ismInput->base.inputBuffer, tmpProcessing );
@@ -5720,7 +6007,14 @@ static ivas_error renderIsmToSplitBinaural(
         pCombinedOrientationData->Quaternions[i] = originalHeadRot[i];
     }
 
-    accumulate2dArrayToBuffer( tmpBinaural, &outAudio );
+    if ( outAudio.config.is_cldfb )
+    {
+        accumulateCLDFBArrayToBuffer( tmpBinaural_CldfbRe, tmpBinaural_CldfbIm, &outAudio );
+    }
+    else
+    {
+        accumulate2dArrayToBuffer( tmpBinaural, &outAudio );
+    }
     pop_wmops();
 
     /* Encoding to split rendering bitstream done at a higher level */
@@ -5755,11 +6049,13 @@ static ivas_error renderInputIsm(
 {
     ivas_error error;
     IVAS_REND_AudioBuffer inAudio;
+    int16_t cldfb2tdSampleFact;
 
     error = IVAS_ERR_OK;
     inAudio = ismInput->base.inputBuffer;
 
-    if ( ismInput->base.numNewSamplesPerChannel != outAudio.config.numSamplesPerChannel )
+    cldfb2tdSampleFact = outAudio.config.is_cldfb ? 2 : 1;
+    if ( ismInput->base.numNewSamplesPerChannel * cldfb2tdSampleFact != outAudio.config.numSamplesPerChannel )
     {
         return IVAS_ERROR( IVAS_ERR_INVALID_BUFFER_SIZE, "Mismatch between the number of input samples vs number of requested output samples - currently not allowed" );
     }
@@ -5884,8 +6180,7 @@ static ivas_error renderLfeToBinaural(
     num_cpy_smpl_prev_frame = mcInput->binauralDelaySmp;
     num_cpy_smpl_cur_frame = frame_size - num_cpy_smpl_prev_frame;
 
-    /* Assuming LFE should be delayed by less that the duration of one frame */
-    assert( mcInput->binauralDelaySmp < frame_size );
+    assert( mcInput->binauralDelaySmp <= MAX_BIN_DELAY_SAMPLES );
 
     /* Get delayed LFE signal from previous frame, apply gain and save in tmp buffer */
     v_multc( mcInput->lfeDelayBuffer, gain, tmpLfeBuffer, num_cpy_smpl_prev_frame );
@@ -7363,8 +7658,8 @@ ivas_error IVAS_REND_MergeMasaMetadata(
 )
 {
     MASA_DECODER_EXT_OUT_META_HANDLE inMeta2;
-    float( *inEne1 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
-    float( *inEne2 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
+    float ( *inEne1 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
+    float ( *inEne2 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
 
     if ( hIvasRend == NULL )
     {
@@ -7487,15 +7782,13 @@ ivas_error IVAS_REND_SetIsmMetadataDelay(
  *-------------------------------------------------------------------*/
 
 static ivas_error getSamplesInternal(
-    IVAS_REND_HANDLE hIvasRend, /* i/o: Renderer handle          */
-    IVAS_REND_AudioBuffer outAudio /* i/o: buffer for output audio  */,
-    IVAS_REND_BitstreamBuffer *hBits /*i/o: buffer for input/output bitstream. Needed in split rendering mode*/
+    IVAS_REND_HANDLE hIvasRend,    /* i/o: Renderer handle          */
+    IVAS_REND_AudioBuffer outAudio /* i/o: buffer for output audio  */
 )
 {
     ivas_error error;
     int16_t numOutChannels;
     int16_t cldfb2tdSampleFact;
-    IVAS_REND_AudioBuffer outAudioOrig;
 
     /* Validate function arguments */
     if ( hIvasRend == NULL || outAudio.data == NULL )
@@ -7555,34 +7848,21 @@ static ivas_error getSamplesInternal(
         }
     }
 
-    if ( ( error = IVAS_REND_NumOutChannels( hIvasRend, &numOutChannels ) ) != IVAS_ERR_OK )
+    if ( ( error = IVAS_REND_GetNumOutChannels( hIvasRend, &numOutChannels ) ) != IVAS_ERR_OK )
     {
         return error;
     }
 
-    if ( numOutChannels != outAudio.config.numChannels && hIvasRend->outputConfig != IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_CODED && hIvasRend->outputConfig != IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM )
+    if ( numOutChannels != outAudio.config.numChannels &&
+         hIvasRend->outputConfig != IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_CODED &&
+         hIvasRend->outputConfig != IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM )
     {
         return IVAS_ERR_WRONG_NUM_CHANNELS;
     }
 
-    /* Clear original output buffer */
+    /* Clear output buffer */
     set_zero( outAudio.data, outAudio.config.numChannels * outAudio.config.numSamplesPerChannel );
 
-    outAudioOrig = outAudio;
-    /* Use internal buffer if outputting split rendering bitstream */
-    if ( ( hIvasRend->outputConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_CODED ) ||
-         ( hIvasRend->outputConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM ) )
-    {
-        int16_t num_poses_orig;
-        num_poses_orig = hIvasRend->splitRendWrapper->multiBinPoseData.num_poses;
-        outAudio = hIvasRend->splitRendEncBuffer;
-        ISAR_PRE_REND_GetMultiBinPoseData( &hIvasRend->hRendererConfig->split_rend_config, &hIvasRend->splitRendWrapper->multiBinPoseData, hIvasRend->headRotData.sr_pose_pred_axis );
-        assert( num_poses_orig == hIvasRend->splitRendWrapper->multiBinPoseData.num_poses && "number of poses should not change dynamically" );
-
-        /* Clear output buffer for split rendering bitstream */
-        set_zero( outAudio.data, outAudio.config.numChannels * outAudio.config.numSamplesPerChannel );
-    }
-
     if ( ( error = renderActiveInputsIsm( hIvasRend, outAudio ) ) != IVAS_ERR_OK )
     {
         return error;
@@ -7603,73 +7883,26 @@ static ivas_error getSamplesInternal(
         return error;
     }
 
-    if ( hIvasRend->outputConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_CODED || hIvasRend->outputConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM )
-    {
-        ISAR_SPLIT_REND_BITS_DATA bits;
-        int16_t cldfb_in_flag;
-        float Cldfb_RealBuffer_Binaural[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS][CLDFB_NO_COL_MAX][CLDFB_NO_CHANNELS_MAX];
-        float Cldfb_ImagBuffer_Binaural[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS][CLDFB_NO_COL_MAX][CLDFB_NO_CHANNELS_MAX];
-        int16_t ch;
-        int16_t i, ro_md_flag;
-        float *tmpBinaural[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS], tmpBinaural_buff[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS][L_FRAME48k];
-
-        for ( ch = 0; ch < MAX_OUTPUT_CHANNELS; ch++ )
-        {
-            tmpBinaural[ch] = tmpBinaural_buff[ch];
-        }
-
-        if ( outAudio.config.is_cldfb == 1 )
-        {
-            cldfb_in_flag = 1;
-            copyBufferToCLDFBarray( outAudio, Cldfb_RealBuffer_Binaural, Cldfb_ImagBuffer_Binaural );
-        }
-        else
-        {
-            cldfb_in_flag = 0;
-            copyBufferTo2dArray( outAudio, tmpBinaural_buff );
-        }
+    return IVAS_ERR_OK;
+}
 
-        /* Encode split rendering bitstream */
-        convertBitsBufferToInternalBitsBuff( *hBits, &bits );
 
-        ro_md_flag = 0;
-        for ( i = 0; i < RENDERER_MAX_ISM_INPUTS; ++i )
-        {
-            if ( hIvasRend->inputsIsm[i].base.inConfig != IVAS_AUDIO_CONFIG_INVALID )
-            {
-                ro_md_flag = 1;
-                break;
-            }
-        }
-
-        if ( ( error = ISAR_PRE_REND_MultiBinToSplitBinaural( hIvasRend->splitRendWrapper,
-                                                              hIvasRend->headRotData.headPositions[0],
-                                                              hIvasRend->hRendererConfig->split_rend_config.splitRendBitRate,
-                                                              hIvasRend->hRendererConfig->split_rend_config.codec,
-                                                              hIvasRend->hRendererConfig->split_rend_config.isar_frame_size_ms,
-                                                              hIvasRend->hRendererConfig->split_rend_config.codec_frame_size_ms,
-                                                              &bits,
-                                                              Cldfb_RealBuffer_Binaural,
-                                                              Cldfb_ImagBuffer_Binaural,
-                                                              ( const int16_t )( ( BINAURAL_MAXBANDS * hIvasRend->sampleRateOut ) / 48000 ),
-                                                              tmpBinaural,
-                                                              1,
-                                                              cldfb_in_flag,
-                                                              ( hIvasRend->outputConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM ) ? 1 : 0,
-                                                              ro_md_flag ) ) != IVAS_ERR_OK )
-        {
-            return error;
-        }
-
-        convertInternalBitsBuffToBitsBuffer( hBits, bits );
+/*-------------------------------------------------------------------*
+ * IVAS_REND_GetSamples()
+ *
+ *
+ *-------------------------------------------------------------------*/
 
-        /* reset to outAudioOrig in case of PCM output */
-        outAudio = outAudioOrig;
+ivas_error IVAS_REND_GetSamples(
+    IVAS_REND_HANDLE hIvasRend,    /* i/o: Renderer handle          */
+    IVAS_REND_AudioBuffer outAudio /* i/o: buffer for output audio  */
+)
+{
+    ivas_error error;
 
-        if ( hIvasRend->outputConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM )
-        {
-            accumulate2dArrayToBuffer( tmpBinaural_buff, &outAudio );
-        }
+    if ( ( error = getSamplesInternal( hIvasRend, outAudio ) ) != IVAS_ERR_OK )
+    {
+        return error;
     }
 
     if ( outAudio.config.is_cldfb == 0 )
@@ -7689,52 +7922,133 @@ static ivas_error getSamplesInternal(
 }
 
 
-/*-------------------------------------------------------------------*
- * IVAS_REND_GetSamples()
- *
- *
- *-------------------------------------------------------------------*/
-
-ivas_error IVAS_REND_GetSamples(
-    IVAS_REND_HANDLE hIvasRend,    /* i/o: Renderer handle          */
-    IVAS_REND_AudioBuffer outAudio /* i/o: buffer for output audio  */
-)
-{
-
-    return getSamplesInternal( hIvasRend, outAudio, NULL );
-}
-
-
 /*-------------------------------------------------------------------*
  * IVAS_REND_GetSplitBinauralBitstream()
  *
  *
  *-------------------------------------------------------------------*/
 
-ivas_error
-IVAS_REND_GetSplitBinauralBitstream(
+ivas_error IVAS_REND_GetSplitBinauralBitstream(
     IVAS_REND_HANDLE hIvasRend,      /* i/o: Renderer handle             */
     IVAS_REND_AudioBuffer outAudio,  /* i/o: buffer for output audio     */
     IVAS_REND_BitstreamBuffer *hBits /* o  : buffer for output bitstream */
 )
 {
+    ivas_error error;
+    int16_t ch;
     int16_t cldfb_in_flag;
+    int16_t i, ro_md_flag;
+    int16_t num_poses_orig;
+    float *tmpBinaural[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS], tmpBinaural_buff[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS][L_FRAME48k];
+    float Cldfb_ImagBuffer_Binaural[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS][CLDFB_NO_COL_MAX][CLDFB_NO_CHANNELS_MAX];
+    float Cldfb_RealBuffer_Binaural[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS][CLDFB_NO_COL_MAX][CLDFB_NO_CHANNELS_MAX];
+    IVAS_REND_AudioBufferConfig *pSplitEncBufConfig;
+    ISAR_SPLIT_REND_CONFIG_HANDLE pSplitRendConfig;
+    ISAR_SPLIT_REND_BITS_DATA bits;
+
+    for ( ch = 0; ch < MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS; ch++ )
+    {
+        tmpBinaural[ch] = tmpBinaural_buff[ch];
+    }
 
     cldfb_in_flag = getCldfbRendFlag( hIvasRend, IVAS_REND_AUDIO_CONFIG_TYPE_UNKNOWN );
-    hIvasRend->splitRendEncBuffer.config.is_cldfb = cldfb_in_flag;
-    if ( hIvasRend->hRendererConfig->split_rend_config.dof == 0 || hIvasRend->hRendererConfig->split_rend_config.poseCorrectionMode == ISAR_SPLIT_REND_POSE_CORRECTION_MODE_NONE )
+    pSplitEncBufConfig = &hIvasRend->splitRendEncBuffer.config;
+    pSplitRendConfig = &hIvasRend->hRendererConfig->split_rend_config;
+
+    /* 0 DoF / No pose correction retains frame size */
+    pSplitEncBufConfig->is_cldfb = cldfb_in_flag;
+    if ( pSplitRendConfig->dof == 0 || pSplitRendConfig->poseCorrectionMode == ISAR_SPLIT_REND_POSE_CORRECTION_MODE_NONE )
     {
-        hIvasRend->splitRendEncBuffer.config.numSamplesPerChannel = outAudio.config.numSamplesPerChannel;
+        pSplitEncBufConfig->numSamplesPerChannel = outAudio.config.numSamplesPerChannel;
     }
+    /* Pose correction requires 20ms */
     else
     {
-        hIvasRend->splitRendEncBuffer.config.numSamplesPerChannel = (int16_t) ( hIvasRend->sampleRateOut / FRAMES_PER_SEC );
+        pSplitEncBufConfig->numSamplesPerChannel = (int16_t) ( hIvasRend->sampleRateOut / FRAMES_PER_SEC );
     }
-    hIvasRend->splitRendEncBuffer.config.numSamplesPerChannel *= cldfb_in_flag ? 2 : 1;
+    pSplitEncBufConfig->numSamplesPerChannel *= cldfb_in_flag ? 2 : 1;
+
+    num_poses_orig = hIvasRend->splitRendWrapper->multiBinPoseData.num_poses;
+    ISAR_PRE_REND_GetMultiBinPoseData( pSplitRendConfig,
+                                       &hIvasRend->splitRendWrapper->multiBinPoseData,
+                                       hIvasRend->headRotData.sr_pose_pred_axis );
+    assert( num_poses_orig == hIvasRend->splitRendWrapper->multiBinPoseData.num_poses && "number of poses should not change dynamically" );
 
-    /* hIvasRend->splitRendEncBuffer used for BINAURAL_SPLIT_CODED output
-       outAudio used for BINAURAL_SPLIT_PCM output */
-    return getSamplesInternal( hIvasRend, outAudio, hBits );
+    /* hIvasRend->splitRendEncBuffer contains multi-pose data for BINAURAL_SPLIT_CODED output
+       outAudio used later for main pose BINAURAL_SPLIT_PCM output */
+    if ( ( error = getSamplesInternal( hIvasRend, hIvasRend->splitRendEncBuffer ) ) != IVAS_ERR_OK )
+    {
+        return error;
+    }
+
+    /* copy outputs */
+    if ( hIvasRend->splitRendEncBuffer.config.is_cldfb == 1 )
+    {
+        cldfb_in_flag = 1;
+        copyBufferToCLDFBarray( hIvasRend->splitRendEncBuffer, Cldfb_RealBuffer_Binaural, Cldfb_ImagBuffer_Binaural );
+    }
+    else
+    {
+        cldfb_in_flag = 0;
+        copyBufferTo2dArray( hIvasRend->splitRendEncBuffer, tmpBinaural_buff );
+    }
+
+    /* Encode split rendering bitstream */
+    convertBitsBufferToInternalBitsBuff( *hBits, &bits );
+
+    ro_md_flag = 0;
+    for ( i = 0; i < RENDERER_MAX_ISM_INPUTS; ++i )
+    {
+        if ( hIvasRend->inputsIsm[i].base.inConfig != IVAS_AUDIO_CONFIG_INVALID )
+        {
+            ro_md_flag = 1;
+            break;
+        }
+    }
+
+    if ( ( error = ISAR_PRE_REND_MultiBinToSplitBinaural( hIvasRend->splitRendWrapper,
+                                                          hIvasRend->headRotData.headPositions[0],
+                                                          pSplitRendConfig->splitRendBitRate,
+                                                          pSplitRendConfig->codec,
+                                                          pSplitRendConfig->isar_frame_size_ms,
+                                                          pSplitRendConfig->codec_frame_size_ms,
+                                                          &bits,
+                                                          Cldfb_RealBuffer_Binaural,
+                                                          Cldfb_ImagBuffer_Binaural,
+                                                          (const int16_t) ( ( BINAURAL_MAXBANDS * hIvasRend->sampleRateOut ) / 48000 ),
+                                                          tmpBinaural,
+                                                          1,
+                                                          cldfb_in_flag,
+                                                          ( hIvasRend->outputConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM ) ? 1 : 0,
+                                                          ro_md_flag ) ) != IVAS_ERR_OK )
+    {
+        return error;
+    }
+
+    convertInternalBitsBuffToBitsBuffer( hBits, bits );
+
+    /* copy over first pose data to outAudio */
+    if ( hIvasRend->outputConfig == IVAS_AUDIO_CONFIG_BINAURAL_SPLIT_PCM )
+    {
+        /* set outAudio to zero - getSamplesInternal only cleared splitRendEncBuffer */
+        set_zero( outAudio.data, outAudio.config.numChannels * outAudio.config.numSamplesPerChannel );
+        accumulate2dArrayToBuffer( tmpBinaural_buff, &outAudio );
+    }
+
+    if ( outAudio.config.is_cldfb == 0 )
+    {
+#ifndef DISABLE_LIMITER
+#ifdef DEBUGGING
+        hIvasRend->numClipping +=
+#endif
+            limitRendererOutput( hIvasRend->hLimiter, outAudio.data, outAudio.config.numSamplesPerChannel, IVAS_LIMITER_THRESHOLD );
+#endif
+    }
+
+    /* update global combined orientation start index */
+    ivas_combined_orientation_update_start_index( hIvasRend->hCombinedOrientationData, outAudio.config.numSamplesPerChannel );
+
+    return IVAS_ERR_OK;
 }
 
 ivas_error IVAS_REND_GetSplitRendBitstreamHeader(
diff --git a/lib_rend/lib_rend.h b/lib_rend/lib_rend.h
index 4ed038df9..7bed7dc1e 100644
--- a/lib_rend/lib_rend.h
+++ b/lib_rend/lib_rend.h
@@ -107,15 +107,15 @@ typedef enum _IVAS_REND_COMPLEXITY_LEVEL
 /* Functions to be called before rendering */
 
 ivas_error IVAS_REND_Open(
-   IVAS_REND_HANDLE *phIvasRend,                    /* i/o: Pointer to renderer handle                          */
-   const int32_t outputSampleRate,                  /* i  : output sampling rate                                */
-   const IVAS_AUDIO_CONFIG outConfig,               /* i  : output audio config                                 */    
-    const bool asHrtfBinary,                        /* i  : load hrtf binary file                               */ 
-   const int16_t nonDiegeticPan,                    /* i  : non-diegetic object flag                            */
-   const float nonDiegeticPanGain,                  /* i  : non-diegetic panning gain                           */
-    const int16_t Opt_Headrotation,                  /* i  : indicates whether head-rotation is used             */
-    const int16_t Opt_ExternalOrientation,           /* i  : indicates whether external orientations are used    */
-    const int16_t num_subframes                      /* i  : number of subframes                                 */
+    IVAS_REND_HANDLE *phIvasRend,                    /* i/o: Pointer to renderer handle                         */
+    const int32_t outputSampleRate,                  /* i  : output sampling rate                               */
+    const IVAS_AUDIO_CONFIG outConfig,               /* i  : output audio config                                */
+    const bool asHrtfBinary,                         /* i  : load hrtf binary file                              */
+    const int16_t nonDiegeticPan,                    /* i  : non-diegetic object flag                           */
+    const float nonDiegeticPanGain,                  /* i  : non-diegetic panning gain                          */
+    const int16_t Opt_Headrotation,                  /* i  : indicates whether head-rotation is used            */
+    const int16_t Opt_ExternalOrientation,           /* i  : indicates whether external orientations are used   */
+    const int16_t num_subframes                      /* i  : number of subframes                                */
 );
 
 /* Note: this will reset custom LFE routings set for any MC input */
@@ -127,7 +127,7 @@ ivas_error IVAS_REND_ConfigureCustomOutputLoudspeakerLayout(
 
 /* Functions to be called before/during rendering */
 
-ivas_error IVAS_REND_NumOutChannels(
+ivas_error IVAS_REND_GetNumOutChannels(
     IVAS_REND_CONST_HANDLE hIvasRend,               /* i  : Renderer handle                                     */
     int16_t *numOutChannels                         /* o  : number of output channels                           */
 );
@@ -218,9 +218,10 @@ ivas_error IVAS_REND_GetHrtfStatisticsHandle(
 /* Functions to be called during rendering */
 
 ivas_error IVAS_REND_FeedInputAudio(
-    IVAS_REND_HANDLE hIvasRend,                     /* i/o: Renderer handle                                     */
-    const IVAS_REND_InputId inputId,                /* i  : ID of the input                                     */
-    const IVAS_REND_ReadOnlyAudioBuffer inputAudio  /* i  : buffer with input audio                             */
+    IVAS_REND_HANDLE hIvasRend,                      /* i/o: Renderer handle                                    */
+    const IVAS_REND_InputId inputId,                 /* i  : ID of the input                                    */
+    const IVAS_REND_ReadOnlyAudioBuffer inputAudio,  /* i  : buffer with input audio                            */
+    const bool flushInputs                           /* i  : flush input audio                                  */
 );
 
 ivas_error IVAS_REND_FeedInputObjectMetadata(
@@ -389,7 +390,7 @@ ivas_error IVAS_REND_GetSamples(
 /* Functions to be called after rendering */
 
 void IVAS_REND_Close(
-    IVAS_REND_HANDLE* phIvasRend                    /* i/o: Pointer to renderer handle                          */
+    IVAS_REND_HANDLE *phIvasRend                    /* i/o: Pointer to renderer handle                          */
 );
 
 
-- 
GitLab


From dbcc7fe866ab79afa15c392e9f80d67d444694c7 Mon Sep 17 00:00:00 2001
From: Jan Kiene <jan.kiene@iis.fraunhofer.de>
Date: Thu, 16 Oct 2025 16:55:51 +0200
Subject: [PATCH 02/12] apply clang-format

---
 lib_rend/lib_rend.c | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/lib_rend/lib_rend.c b/lib_rend/lib_rend.c
index be41a9dbd..a621956a9 100644
--- a/lib_rend/lib_rend.c
+++ b/lib_rend/lib_rend.c
@@ -7602,8 +7602,8 @@ ivas_error IVAS_REND_MergeMasaMetadata(
 )
 {
     MASA_DECODER_EXT_OUT_META_HANDLE inMeta2;
-    float ( *inEne1 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
-    float ( *inEne2 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
+    float( *inEne1 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
+    float( *inEne2 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
 
     if ( hIvasRend == NULL )
     {
@@ -7959,7 +7959,7 @@ ivas_error IVAS_REND_GetSplitBinauralBitstream(
                                                           &bits,
                                                           Cldfb_RealBuffer_Binaural,
                                                           Cldfb_ImagBuffer_Binaural,
-                                                          (const int16_t) ( ( BINAURAL_MAXBANDS * hIvasRend->sampleRateOut ) / 48000 ),
+                                                          ( const int16_t )( ( BINAURAL_MAXBANDS * hIvasRend->sampleRateOut ) / 48000 ),
                                                           tmpBinaural,
                                                           1,
                                                           cldfb_in_flag,
-- 
GitLab


From 6f3ffe536453218dab74eb42d9d997213d5b558d Mon Sep 17 00:00:00 2001
From: Jan Kiene <jan.kiene@iis.fraunhofer.de>
Date: Thu, 16 Oct 2025 17:10:01 +0200
Subject: [PATCH 03/12] fix incorrect port in one file + add forgotten file

---
 lib_rend/ivas_td_ring_buffer.c | 288 +++++++++++++++++++++++++++++++++
 lib_rend/lib_rend.c            |   6 +-
 2 files changed, 289 insertions(+), 5 deletions(-)
 create mode 100644 lib_rend/ivas_td_ring_buffer.c

diff --git a/lib_rend/ivas_td_ring_buffer.c b/lib_rend/ivas_td_ring_buffer.c
new file mode 100644
index 000000000..5c9c6089b
--- /dev/null
+++ b/lib_rend/ivas_td_ring_buffer.c
@@ -0,0 +1,288 @@
+/******************************************************************************************************
+
+   (C) 2022-2025 IVAS codec Public Collaboration with portions copyright Dolby International AB, Ericsson AB,
+   Fraunhofer-Gesellschaft zur Foerderung der angewandten Forschung e.V., Huawei Technologies Co. LTD.,
+   Koninklijke Philips N.V., Nippon Telegraph and Telephone Corporation, Nokia Technologies Oy, Orange,
+   Panasonic Holdings Corporation, Qualcomm Technologies, Inc., VoiceAge Corporation, and other
+   contributors to this repository. All Rights Reserved.
+
+   This software is protected by copyright law and by international treaties.
+   The IVAS codec Public Collaboration consisting of Dolby International AB, Ericsson AB,
+   Fraunhofer-Gesellschaft zur Foerderung der angewandten Forschung e.V., Huawei Technologies Co. LTD.,
+   Koninklijke Philips N.V., Nippon Telegraph and Telephone Corporation, Nokia Technologies Oy, Orange,
+   Panasonic Holdings Corporation, Qualcomm Technologies, Inc., VoiceAge Corporation, and other
+   contributors to this repository retain full ownership rights in their respective contributions in
+   the software. This notice grants no license of any kind, including but not limited to patent
+   license, nor is any license granted by implication, estoppel or otherwise.
+
+   Contributors are required to enter into the IVAS codec Public Collaboration agreement before making
+   contributions.
+
+   This software is provided "AS IS", without any express or implied warranties. The software is in the
+   development stage. It is intended exclusively for experts who have experience with such software and
+   solely for the purpose of inspection. All implied warranties of non-infringement, merchantability
+   and fitness for a particular purpose are hereby disclaimed and excluded.
+
+   Any dispute, controversy or claim arising under or in relation to providing this software shall be
+   submitted to and settled by the final, binding jurisdiction of the courts of Munich, Germany in
+   accordance with the laws of the Federal Republic of Germany excluding its conflict of law rules and
+   the United Nations Convention on Contracts on the International Sales of Goods.
+
+*******************************************************************************************************/
+
+#include <assert.h>
+#include <stdlib.h>
+#include "ivas_error_utils.h"
+#include "ivas_prot_rend.h"
+#include "options.h"
+#include "wmc_auto.h"
+
+
+/*-----------------------------------------------------------------------*
+ * Local function prototypes
+ *-----------------------------------------------------------------------*/
+
+static uint32_t ivas_td_ringbuf_total_size(
+    TD_RINGBUF_HANDLE h )
+{
+    if ( h->is_full ) /* read_pos == write_pos alone is ambiguous; is_full marks the full case */
+    {
+        return h->capacity;
+    }
+
+    if ( h->read_pos <= h->write_pos ) /* no wrap around; equal positions here mean empty */
+    {
+        return h->write_pos - h->read_pos;
+    }
+    /* else write_pos has wrapped around and lies behind read_pos */
+    return h->write_pos + h->capacity - h->read_pos;
+}
+
+
+static int16_t ivas_td_ringbuf_has_space_for_num_samples(
+    TD_RINGBUF_HANDLE h,         /* i  : Ring buffer handle                                  */
+    const uint32_t num_samples ) /* i  : Number of values to add, counted over all channels  */
+{
+    return (int16_t) ( ivas_td_ringbuf_total_size( h ) + num_samples <= h->capacity ); /* 1 if the values still fit, 0 otherwise */
+}
+
+
+/*-----------------------------------------------------------------------*
+ * Global function definitions
+ *-----------------------------------------------------------------------*/
+
+/*---------------------------------------------------------------------*
+ * ivas_TD_RINGBUF_Open()
+ *
+ * Allocate a ring buffer for TD data with the given capacity of TD samples per channel.
+ * If only the sample storage allocation fails, *ph already holds the handle (data == NULL, capacity == 0).
+ * May return IVAS_ERR_FAILED_ALLOC on failed allocation, or IVAS_ERR_OK otherwise.
+ *---------------------------------------------------------------------*/
+
+ivas_error ivas_TD_RINGBUF_Open(
+    TD_RINGBUF_HANDLE *ph,               /* i/o: Ring buffer handle                     */
+    const uint32_t capacity_per_channel, /* i  : Number of samples stored per channel   */
+    const uint16_t num_channels          /* i  : Number of channels                     */
+)
+{
+    TD_RINGBUF_HANDLE h;
+    uint32_t capacity;
+
+    capacity = capacity_per_channel * num_channels; /* total number of float values over all channels */
+
+    h = malloc( sizeof( TD_RINGBUF_DATA ) );
+    if ( h == NULL )
+    {
+        return IVAS_ERROR( IVAS_ERR_FAILED_ALLOC, "Failed to allocate memory for TD ring buffer\n" ); /* *ph is left untouched here */
+    }
+    h->data = NULL;
+    h->capacity = 0;
+    h->num_channels = num_channels;
+    h->write_pos = 0;
+    h->read_pos = 0;
+    h->is_full = 0;
+    *ph = h; /* handle is handed out before the sample storage is allocated */
+
+    h->data = malloc( capacity * sizeof( float ) );
+    if ( h->data == NULL )
+    {
+        return IVAS_ERROR( IVAS_ERR_FAILED_ALLOC, "Failed to allocate memory for TD ring buffer\n" );
+    }
+    h->capacity = capacity; /* only set once the storage exists */
+
+    return IVAS_ERR_OK;
+}
+
+
+/*---------------------------------------------------------------------*
+ * ivas_TD_RINGBUF_Close()
+ *
+ * Deallocate TD ring buffer. The given handle will be set to NULL.
+ * Passing NULL or a pointer to a NULL handle is a no-op.
+ *---------------------------------------------------------------------*/
+
+void ivas_TD_RINGBUF_Close(
+    TD_RINGBUF_HANDLE *ph /* i/o: Ring buffer handle */
+)
+{
+    TD_RINGBUF_HANDLE h;
+
+    if ( ph == NULL )
+    {
+        return;
+    }
+    h = *ph;
+
+    if ( h == NULL )
+    {
+        return;
+    }
+
+    if ( h->data != NULL ) /* data is NULL when ivas_TD_RINGBUF_Open() failed on the storage allocation */
+    {
+        free( h->data );
+    }
+
+    free( h );
+    *ph = NULL;
+
+    return;
+}
+
+
+/*---------------------------------------------------------------------*
+ * ivas_TD_RINGBUF_Push()
+ *
+ * Push samples onto the back of the TD ring buffer.
+ * Input is read channel after channel and stored interleaved; pushing 0 samples leaves the buffer unchanged.
+ *---------------------------------------------------------------------*/
+
+void ivas_TD_RINGBUF_Push(
+    TD_RINGBUF_HANDLE h,                   /* i/o: Ring buffer handle                       */
+    const float *data,                     /* i  : Input data, num_samples_per_channel consecutive values per channel */
+    const uint32_t num_samples_per_channel /* i  : Number of samples per channel to store   */
+)
+{
+    uint32_t s;
+    uint16_t c;
+
+    assert( ivas_td_ringbuf_has_space_for_num_samples( h, num_samples_per_channel * h->num_channels ) );
+
+    for ( s = 0; s < num_samples_per_channel; ++s )
+    {
+        for ( c = 0; c < h->num_channels; ++c )
+        {
+            h->data[h->write_pos] = *( data + c * num_samples_per_channel + s );
+            ++h->write_pos;
+
+            if ( h->write_pos == h->capacity )
+            {
+                h->write_pos = 0;
+            }
+        }
+    }
+    /* a push of zero samples must not flag an empty buffer (read_pos == write_pos) as full */
+    if ( num_samples_per_channel > 0 && h->read_pos == h->write_pos )
+    {
+        h->is_full = 1;
+    }
+
+    return;
+}
+
+
+/*---------------------------------------------------------------------*
+ * ivas_TD_RINGBUF_PushZeros()
+ *
+ * Push zero samples onto the back of the TD ring buffer. Pushing 0 samples leaves the buffer unchanged.
+ *---------------------------------------------------------------------*/
+
+void ivas_TD_RINGBUF_PushZeros(
+    TD_RINGBUF_HANDLE h,                   /* i/o: Ring buffer handle                   */
+    const uint32_t num_samples_per_channel /* i  : Number of zeros per channel to store */
+)
+{
+    uint32_t s;
+    uint16_t c;
+
+    assert( ivas_td_ringbuf_has_space_for_num_samples( h, num_samples_per_channel * h->num_channels ) );
+    if ( !num_samples_per_channel ) /* nothing to write; returning here keeps an empty buffer from being flagged full below */
+    {
+        return;
+    }
+
+    for ( s = 0; s < num_samples_per_channel; ++s )
+    {
+        for ( c = 0; c < h->num_channels; ++c )
+        {
+            h->data[h->write_pos] = 0.f;
+            ++h->write_pos;
+
+            if ( h->write_pos == h->capacity ) /* wrap around at the end of the storage */
+            {
+                h->write_pos = 0;
+            }
+        }
+    }
+
+    if ( h->read_pos == h->write_pos ) /* write position caught up with the read position: buffer is full */
+    {
+        h->is_full = 1;
+    }
+
+    return;
+}
+
+
+/*---------------------------------------------------------------------*
+ * ivas_TD_RINGBUF_Pop()
+ *
+ * Pop samples from the front of the TD ring buffer into channel-wise output; popping 0 samples leaves the buffer unchanged.
+ *---------------------------------------------------------------------*/
+
+void ivas_TD_RINGBUF_Pop(
+    TD_RINGBUF_HANDLE h,                   /* i/o: Ring buffer handle                           */
+    float *data,                           /* o  : Output data, num_samples_per_channel consecutive values per channel */
+    const uint32_t num_samples_per_channel /* i  : Number of samples per channel to retrieve    */
+)
+{
+    uint32_t s;
+    uint16_t c;
+
+    assert( ivas_td_ringbuf_total_size( h ) >= num_samples_per_channel * h->num_channels );
+
+    for ( s = 0; s < num_samples_per_channel; ++s )
+    {
+        for ( c = 0; c < h->num_channels; ++c )
+        {
+            *( data + c * num_samples_per_channel + s ) = h->data[h->read_pos];
+            ++h->read_pos;
+
+            if ( h->read_pos == h->capacity )
+            {
+                h->read_pos = 0;
+            }
+        }
+    }
+    /* only a pop that removed samples frees space; a pop of zero samples must keep a full buffer full */
+    if ( num_samples_per_channel > 0 )
+    {
+        h->is_full = 0;
+    }
+
+    return;
+}
+
+
+/*---------------------------------------------------------------------*
+ * ivas_TD_RINGBUF_Size()
+ *
+ * Returns number of buffered samples per channel (total number of stored values divided by num_channels).
+ *---------------------------------------------------------------------*/
+
+uint32_t ivas_TD_RINGBUF_Size(
+    const TD_RINGBUF_HANDLE h /* i  : Ring buffer handle */
+)
+{
+    return ivas_td_ringbuf_total_size( h ) / (uint32_t) h->num_channels;
+}
diff --git a/lib_rend/lib_rend.c b/lib_rend/lib_rend.c
index a621956a9..54b55108f 100644
--- a/lib_rend/lib_rend.c
+++ b/lib_rend/lib_rend.c
@@ -3681,11 +3681,7 @@ static int16_t getCldfbRendFlag(
             numSbaInputs += ( hIvasRend->inputsSba[i].base.inConfig == IVAS_AUDIO_CONFIG_INVALID && new_configType != IVAS_REND_AUDIO_CONFIG_TYPE_AMBISONICS ) ? 0 : 1;
         }
 
-        if ( numIsmInputs > 0 || numMcInputs > 0 )
-        {
-            isCldfbRend = 0;
-        }
-        else if ( ( numMasaInputs > 0 ) || ( numSbaInputs > 0 && hIvasRend->hRendererConfig->split_rend_config.rendererSelection == IVAS_BIN_RENDERER_TYPE_FASTCONV ) )
+        if ( ( numMasaInputs > 0 ) || ( numSbaInputs > 0 && hIvasRend->hRendererConfig->split_rend_config.rendererSelection == IVAS_BIN_RENDERER_TYPE_FASTCONV ) )
         {
             isCldfbRend = 1;
         }
-- 
GitLab


From 9d09e4b52b656736a6e846012e89d122a0e13dc7 Mon Sep 17 00:00:00 2001
From: Kacper Sagnowski <kacper.sagnowski@iis.fraunhofer.de>
Date: Mon, 20 Oct 2025 14:15:51 +0200
Subject: [PATCH 04/12] Improve documentation comments for TD ring buffer

---
 lib_rend/ivas_stat_rend.h      | 4 ++--
 lib_rend/ivas_td_ring_buffer.c | 6 ++++++
 2 files changed, 8 insertions(+), 2 deletions(-)

diff --git a/lib_rend/ivas_stat_rend.h b/lib_rend/ivas_stat_rend.h
index b9c560afe..011b44ff0 100644
--- a/lib_rend/ivas_stat_rend.h
+++ b/lib_rend/ivas_stat_rend.h
@@ -1381,8 +1381,8 @@ typedef struct
 
 typedef struct
 {
-    float *data; /* samples in interleaved layout */
-    uint32_t capacity;
+    float *data;       /* samples in interleaved layout, e.g. for channels A, B, C, samples are stored: A1, B1, C1, A2, B2, C2, ... */
+    uint32_t capacity; /* max number of float values that can be stored */
     uint16_t num_channels;
     uint32_t write_pos;
     uint32_t read_pos;
diff --git a/lib_rend/ivas_td_ring_buffer.c b/lib_rend/ivas_td_ring_buffer.c
index 5c9c6089b..a580fe549 100644
--- a/lib_rend/ivas_td_ring_buffer.c
+++ b/lib_rend/ivas_td_ring_buffer.c
@@ -42,6 +42,12 @@
  * Local function prototypes
  *-----------------------------------------------------------------------*/
 
+/*---------------------------------------------------------------------*
+ * ivas_td_ringbuf_total_size()
+ *
+ * Returns total number of buffered samples (including number of channels)
+ *---------------------------------------------------------------------*/
+
 static uint32_t ivas_td_ringbuf_total_size(
     TD_RINGBUF_HANDLE h )
 {
-- 
GitLab


From 058a764376b587dc239a9c3bd10ee645516795c9 Mon Sep 17 00:00:00 2001
From: Jan Kiene <jan.kiene@iis.fraunhofer.de>
Date: Fri, 24 Oct 2025 17:08:33 +0200
Subject: [PATCH 05/12] turn md delay renderer argument into integer type

---
 apps/renderer.c     |  5 +++--
 lib_rend/lib_rend.c | 33 ++++++++++++---------------------
 lib_rend/lib_rend.h |  2 +-
 3 files changed, 16 insertions(+), 24 deletions(-)

diff --git a/apps/renderer.c b/apps/renderer.c
index 3f8c479d9..eccabd2a6 100644
--- a/apps/renderer.c
+++ b/apps/renderer.c
@@ -33,6 +33,7 @@
 #include "lib_rend.h"
 #include <assert.h>
 #include <math.h>
+#include <stdint.h>
 #include <string.h>
 #include "audio_file_reader.h"
 #include "audio_file_writer.h"
@@ -186,7 +187,7 @@ typedef struct
     float lfeConfigElevation;
     bool lfeCustomRoutingEnabled;
     char inLfePanningMatrixFile[RENDERER_MAX_CLI_ARG_LENGTH];
-    float syncMdDelay;
+    int16_t syncMdDelay;
     IVAS_RENDER_FRAMESIZE render_framesize;
     uint16_t directivityPatternId[RENDERER_MAX_ISM_INPUTS];
     AcousticEnvironmentSequence aeSequence;
@@ -2904,7 +2905,7 @@ static void parseOption(
         case CmdLnOptionId_syncMdDelay:
             assert( numOptionValues == 1 );
             /* Metadata Delay to sync with audio delay in ms */
-            args->syncMdDelay = strtof( optionValues[0], NULL );
+            args->syncMdDelay = (int16_t) strtol( optionValues[0], NULL, 10 );
             break;
         default:
             assert( 0 && "This should be unreachable - all command line options should be explicitly handled." );
diff --git a/lib_rend/lib_rend.c b/lib_rend/lib_rend.c
index be092691f..a479af20f 100644
--- a/lib_rend/lib_rend.c
+++ b/lib_rend/lib_rend.c
@@ -44,6 +44,7 @@
 #include <math.h>
 #include <stdbool.h>
 #include "wmc_auto.h"
+#include <stdint.h>
 
 
 /*-------------------------------------------------------------------*
@@ -125,7 +126,7 @@ typedef struct
 #ifdef NONBE_1377_REND_DIRATT_CONF
     int16_t object_id;
 #endif
-    float ism_metadata_delay_ms;
+    int16_t ism_metadata_delay_ms;
 } input_ism;
 
 typedef struct
@@ -1510,7 +1511,7 @@ static ivas_error alignInputDelay(
             if ( getAudioConfigType( inputBase->inConfig ) == IVAS_REND_AUDIO_CONFIG_TYPE_OBJECT_BASED )
             {
                 inputIsm = (input_ism *) inputBase;
-                inputIsm->ism_metadata_delay_ms = maxGlobalDelayNs / 1e6f;
+                inputIsm->ism_metadata_delay_ms = (int16_t) roundf( inputIsm->ism_metadata_delay_ms + maxGlobalDelayNs / 1e6f / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
             }
         }
     }
@@ -5473,14 +5474,12 @@ static ivas_error renderIsmToBinaural(
 {
     float tmpTDRendBuffer[MAX_OUTPUT_CHANNELS][L_FRAME48k];
     ivas_error error;
-    int16_t ism_md_subframe_update_ext;
 
     push_wmops( "renderIsmToBinaural" );
-    /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
-    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
+
     copyBufferTo2dArray( ismInput->base.inputBuffer, tmpTDRendBuffer );
 
-    if ( ( error = ivas_td_binaural_renderer_ext( &ismInput->tdRendWrapper, ismInput->base.inConfig, NULL, ismInput->base.ctx.pCombinedOrientationData, &ismInput->currentPos, ismInput->hReverb, ism_md_subframe_update_ext,
+    if ( ( error = ivas_td_binaural_renderer_ext( &ismInput->tdRendWrapper, ismInput->base.inConfig, NULL, ismInput->base.ctx.pCombinedOrientationData, &ismInput->currentPos, ismInput->hReverb, ismInput->ism_metadata_delay_ms,
                                                   *ismInput->base.ctx.pOutSampleRate, outAudio.config.numSamplesPerChannel, tmpTDRendBuffer ) ) != IVAS_ERR_OK )
     {
         return error;
@@ -5675,17 +5674,13 @@ static ivas_error renderIsmToBinauralReverb(
 {
     float tmpRendBuffer[MAX_OUTPUT_CHANNELS][L_FRAME48k];
     ivas_error error;
-    int16_t ism_md_subframe_update_ext;
 
     push_wmops( "renderIsmToBinauralRoom" );
 
-    /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
-    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
-
     copyBufferTo2dArray( ismInput->base.inputBuffer, tmpRendBuffer );
 
     if ( ( error = ivas_td_binaural_renderer_ext( &ismInput->tdRendWrapper, ismInput->base.inConfig, NULL, ismInput->base.ctx.pCombinedOrientationData, &ismInput->currentPos, ismInput->hReverb,
-                                                  ism_md_subframe_update_ext, *ismInput->base.ctx.pOutSampleRate, outAudio.config.numSamplesPerChannel, tmpRendBuffer ) ) != IVAS_ERR_OK )
+                                                  ismInput->ism_metadata_delay_ms, *ismInput->base.ctx.pOutSampleRate, outAudio.config.numSamplesPerChannel, tmpRendBuffer ) ) != IVAS_ERR_OK )
     {
         return error;
     }
@@ -5852,16 +5847,12 @@ static ivas_error renderIsmToSplitBinaural(
     float tmpBinaural_CldfbIm[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS][CLDFB_NO_COL_MAX][CLDFB_NO_CHANNELS_MAX];
     int16_t output_frame = ismInput->base.inputBuffer.config.numSamplesPerChannel;
     COMBINED_ORIENTATION_HANDLE pCombinedOrientationData;
-    int16_t ism_md_subframe_update_ext;
 
     push_wmops( "renderIsmToSplitBinaural" );
 
     pSplitRendWrapper = ismInput->base.ctx.pSplitRendWrapper;
     pMultiBinPoseData = &pSplitRendWrapper->multiBinPoseData;
 
-    /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
-    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
-
     pCombinedOrientationData = *ismInput->base.ctx.pCombinedOrientationData;
 
     if ( pMultiBinPoseData->poseCorrectionMode == ISAR_SPLIT_REND_POSE_CORRECTION_MODE_CLDFB )
@@ -5911,7 +5902,7 @@ static ivas_error renderIsmToSplitBinaural(
 
         /* Render */
         if ( ( error = ivas_td_binaural_renderer_ext( ( pos_idx == 0 ) ? &ismInput->tdRendWrapper : &ismInput->splitTdRendWrappers[pos_idx - 1], ismInput->base.inConfig, NULL, ismInput->base.ctx.pCombinedOrientationData, &ismInput->currentPos,
-                                                      NULL, ism_md_subframe_update_ext, *ismInput->base.ctx.pOutSampleRate, output_frame, tmpProcessing ) ) != IVAS_ERR_OK )
+                                                      NULL, ismInput->ism_metadata_delay_ms, *ismInput->base.ctx.pOutSampleRate, output_frame, tmpProcessing ) ) != IVAS_ERR_OK )
         {
             return error;
         }
@@ -7585,8 +7576,8 @@ ivas_error IVAS_REND_MergeMasaMetadata(
 )
 {
     MASA_DECODER_EXT_OUT_META_HANDLE inMeta2;
-    float( *inEne1 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
-    float( *inEne2 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
+    float ( *inEne1 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
+    float ( *inEne2 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
 
     if ( hIvasRend == NULL )
     {
@@ -7683,7 +7674,7 @@ ivas_error IVAS_REND_SetTotalNumberOfObjects(
 
 ivas_error IVAS_REND_SetIsmMetadataDelay(
     IVAS_REND_HANDLE hIvasRend, /* i/o: IVAS renderer handle    */
-    const float sync_md_delay   /* i  : ISM Metadata Delay in ms to sync with audio delay   */
+    const int16_t sync_md_delay /* i  : ISM Metadata Delay in ms to sync with audio delay   */
 )
 {
     int16_t i;
@@ -7695,7 +7686,7 @@ ivas_error IVAS_REND_SetIsmMetadataDelay(
 
     for ( i = 0; i < RENDERER_MAX_ISM_INPUTS; ++i )
     {
-        hIvasRend->inputsIsm[i].ism_metadata_delay_ms = sync_md_delay;
+        hIvasRend->inputsIsm[i].ism_metadata_delay_ms = (int16_t) roundf( sync_md_delay / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
     }
 
     return IVAS_ERR_OK;
@@ -7942,7 +7933,7 @@ ivas_error IVAS_REND_GetSplitBinauralBitstream(
                                                           &bits,
                                                           Cldfb_RealBuffer_Binaural,
                                                           Cldfb_ImagBuffer_Binaural,
-                                                          ( const int16_t )( ( BINAURAL_MAXBANDS * hIvasRend->sampleRateOut ) / 48000 ),
+                                                          (const int16_t) ( ( BINAURAL_MAXBANDS * hIvasRend->sampleRateOut ) / 48000 ),
                                                           tmpBinaural,
                                                           1,
                                                           cldfb_in_flag,
diff --git a/lib_rend/lib_rend.h b/lib_rend/lib_rend.h
index 211fd0d6e..f2cf92e08 100644
--- a/lib_rend/lib_rend.h
+++ b/lib_rend/lib_rend.h
@@ -380,7 +380,7 @@ ivas_error IVAS_REND_SetTotalNumberOfObjects(
 
 ivas_error IVAS_REND_SetIsmMetadataDelay(
     IVAS_REND_HANDLE hIvasRend,                     /* i/o: IVAS renderer handle                                */
-    const float sync_md_delay                       /* i  :   Metadata Delay in ms to sync with audio delay     */
+    const int16_t sync_md_delay                       /* i  :   Metadata Delay in ms to sync with audio delay     */
 );
 
 ivas_error IVAS_REND_GetNumAllObjects(
-- 
GitLab


From 27771584f23bdc88c8e7c1a75b76435f72cee10d Mon Sep 17 00:00:00 2001
From: Jan Kiene <jan.kiene@iis.fraunhofer.de>
Date: Wed, 29 Oct 2025 14:48:01 +0100
Subject: [PATCH 06/12] make sure to store the delay in ms and not already
 converted to subframe indices

---
 lib_rend/lib_rend.c | 20 +++++++++++++++-----
 1 file changed, 15 insertions(+), 5 deletions(-)

diff --git a/lib_rend/lib_rend.c b/lib_rend/lib_rend.c
index a479af20f..a21401e2f 100644
--- a/lib_rend/lib_rend.c
+++ b/lib_rend/lib_rend.c
@@ -1511,7 +1511,7 @@ static ivas_error alignInputDelay(
             if ( getAudioConfigType( inputBase->inConfig ) == IVAS_REND_AUDIO_CONFIG_TYPE_OBJECT_BASED )
             {
                 inputIsm = (input_ism *) inputBase;
-                inputIsm->ism_metadata_delay_ms = (int16_t) roundf( inputIsm->ism_metadata_delay_ms + maxGlobalDelayNs / 1e6f / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
+                inputIsm->ism_metadata_delay_ms = (int16_t) roundf( inputIsm->ism_metadata_delay_ms + maxGlobalDelayNs / 1e6f );
             }
         }
     }
@@ -5474,12 +5474,15 @@ static ivas_error renderIsmToBinaural(
 {
     float tmpTDRendBuffer[MAX_OUTPUT_CHANNELS][L_FRAME48k];
     ivas_error error;
+    int16_t ism_md_subframe_update_ext;
 
     push_wmops( "renderIsmToBinaural" );
 
+    /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
+    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
     copyBufferTo2dArray( ismInput->base.inputBuffer, tmpTDRendBuffer );
 
-    if ( ( error = ivas_td_binaural_renderer_ext( &ismInput->tdRendWrapper, ismInput->base.inConfig, NULL, ismInput->base.ctx.pCombinedOrientationData, &ismInput->currentPos, ismInput->hReverb, ismInput->ism_metadata_delay_ms,
+    if ( ( error = ivas_td_binaural_renderer_ext( &ismInput->tdRendWrapper, ismInput->base.inConfig, NULL, ismInput->base.ctx.pCombinedOrientationData, &ismInput->currentPos, ismInput->hReverb, ism_md_subframe_update_ext,
                                                   *ismInput->base.ctx.pOutSampleRate, outAudio.config.numSamplesPerChannel, tmpTDRendBuffer ) ) != IVAS_ERR_OK )
     {
         return error;
@@ -5674,13 +5677,16 @@ static ivas_error renderIsmToBinauralReverb(
 {
     float tmpRendBuffer[MAX_OUTPUT_CHANNELS][L_FRAME48k];
     ivas_error error;
+    int16_t ism_md_subframe_update_ext;
 
     push_wmops( "renderIsmToBinauralRoom" );
 
+    /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
+    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
     copyBufferTo2dArray( ismInput->base.inputBuffer, tmpRendBuffer );
 
     if ( ( error = ivas_td_binaural_renderer_ext( &ismInput->tdRendWrapper, ismInput->base.inConfig, NULL, ismInput->base.ctx.pCombinedOrientationData, &ismInput->currentPos, ismInput->hReverb,
-                                                  ismInput->ism_metadata_delay_ms, *ismInput->base.ctx.pOutSampleRate, outAudio.config.numSamplesPerChannel, tmpRendBuffer ) ) != IVAS_ERR_OK )
+                                                  ism_md_subframe_update_ext, *ismInput->base.ctx.pOutSampleRate, outAudio.config.numSamplesPerChannel, tmpRendBuffer ) ) != IVAS_ERR_OK )
     {
         return error;
     }
@@ -5847,12 +5853,16 @@ static ivas_error renderIsmToSplitBinaural(
     float tmpBinaural_CldfbIm[MAX_HEAD_ROT_POSES * BINAURAL_CHANNELS][CLDFB_NO_COL_MAX][CLDFB_NO_CHANNELS_MAX];
     int16_t output_frame = ismInput->base.inputBuffer.config.numSamplesPerChannel;
     COMBINED_ORIENTATION_HANDLE pCombinedOrientationData;
+    int16_t ism_md_subframe_update_ext;
 
     push_wmops( "renderIsmToSplitBinaural" );
 
     pSplitRendWrapper = ismInput->base.ctx.pSplitRendWrapper;
     pMultiBinPoseData = &pSplitRendWrapper->multiBinPoseData;
 
+    /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
+    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
+
     pCombinedOrientationData = *ismInput->base.ctx.pCombinedOrientationData;
 
     if ( pMultiBinPoseData->poseCorrectionMode == ISAR_SPLIT_REND_POSE_CORRECTION_MODE_CLDFB )
@@ -5902,7 +5912,7 @@ static ivas_error renderIsmToSplitBinaural(
 
         /* Render */
         if ( ( error = ivas_td_binaural_renderer_ext( ( pos_idx == 0 ) ? &ismInput->tdRendWrapper : &ismInput->splitTdRendWrappers[pos_idx - 1], ismInput->base.inConfig, NULL, ismInput->base.ctx.pCombinedOrientationData, &ismInput->currentPos,
-                                                      NULL, ismInput->ism_metadata_delay_ms, *ismInput->base.ctx.pOutSampleRate, output_frame, tmpProcessing ) ) != IVAS_ERR_OK )
+                                                      NULL, ism_md_subframe_update_ext, *ismInput->base.ctx.pOutSampleRate, output_frame, tmpProcessing ) ) != IVAS_ERR_OK )
         {
             return error;
         }
@@ -7686,7 +7696,7 @@ ivas_error IVAS_REND_SetIsmMetadataDelay(
 
     for ( i = 0; i < RENDERER_MAX_ISM_INPUTS; ++i )
     {
-        hIvasRend->inputsIsm[i].ism_metadata_delay_ms = (int16_t) roundf( sync_md_delay / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
+        hIvasRend->inputsIsm[i].ism_metadata_delay_ms = sync_md_delay;
     }
 
     return IVAS_ERR_OK;
-- 
GitLab


From 07ef3ad1cb901d96fa038b1c225dba8d9904f39b Mon Sep 17 00:00:00 2001
From: Jan Kiene <jan.kiene@iis.fraunhofer.de>
Date: Wed, 29 Oct 2025 15:07:13 +0100
Subject: [PATCH 07/12] use a single constant instead of multiple ones

---
 lib_rend/lib_rend.c | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/lib_rend/lib_rend.c b/lib_rend/lib_rend.c
index a21401e2f..a0da4e4b3 100644
--- a/lib_rend/lib_rend.c
+++ b/lib_rend/lib_rend.c
@@ -5479,7 +5479,7 @@ static ivas_error renderIsmToBinaural(
     push_wmops( "renderIsmToBinaural" );
 
     /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
-    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
+    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / (float) BINAURAL_RENDERING_FRAME_SIZE_MS );
     copyBufferTo2dArray( ismInput->base.inputBuffer, tmpTDRendBuffer );
 
     if ( ( error = ivas_td_binaural_renderer_ext( &ismInput->tdRendWrapper, ismInput->base.inConfig, NULL, ismInput->base.ctx.pCombinedOrientationData, &ismInput->currentPos, ismInput->hReverb, ism_md_subframe_update_ext,
@@ -5682,7 +5682,7 @@ static ivas_error renderIsmToBinauralReverb(
     push_wmops( "renderIsmToBinauralRoom" );
 
     /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
-    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
+    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / (float) BINAURAL_RENDERING_FRAME_SIZE_MS );
     copyBufferTo2dArray( ismInput->base.inputBuffer, tmpRendBuffer );
 
     if ( ( error = ivas_td_binaural_renderer_ext( &ismInput->tdRendWrapper, ismInput->base.inConfig, NULL, ismInput->base.ctx.pCombinedOrientationData, &ismInput->currentPos, ismInput->hReverb,
@@ -5861,7 +5861,7 @@ static ivas_error renderIsmToSplitBinaural(
     pMultiBinPoseData = &pSplitRendWrapper->multiBinPoseData;
 
     /* Metadata Delay to sync with audio delay converted from ms to 5ms (1000/50/4) subframe index */
-    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / ( 1000.f / FRAMES_PER_SEC / MAX_PARAM_SPATIAL_SUBFRAMES ) );
+    ism_md_subframe_update_ext = (int16_t) roundf( ismInput->ism_metadata_delay_ms / (float) BINAURAL_RENDERING_FRAME_SIZE_MS );
 
     pCombinedOrientationData = *ismInput->base.ctx.pCombinedOrientationData;
 
-- 
GitLab


From cd41e576f5adbb8ee288dfae009d3843f885a6bb Mon Sep 17 00:00:00 2001
From: Jan Kiene <jan.kiene@iis.fraunhofer.de>
Date: Wed, 29 Oct 2025 18:16:06 +0100
Subject: [PATCH 08/12] clang-format

---
 lib_rend/lib_rend.c | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/lib_rend/lib_rend.c b/lib_rend/lib_rend.c
index 4d0dfcbea..b910be38b 100644
--- a/lib_rend/lib_rend.c
+++ b/lib_rend/lib_rend.c
@@ -7649,8 +7649,8 @@ ivas_error IVAS_REND_MergeMasaMetadata(
 )
 {
     MASA_DECODER_EXT_OUT_META_HANDLE inMeta2;
-    float ( *inEne1 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
-    float ( *inEne2 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
+    float( *inEne1 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
+    float( *inEne2 )[MAX_PARAM_SPATIAL_SUBFRAMES][MASA_FREQUENCY_BANDS];
 
     if ( hIvasRend == NULL )
     {
@@ -8006,7 +8006,7 @@ ivas_error IVAS_REND_GetSplitBinauralBitstream(
                                                           &bits,
                                                           Cldfb_RealBuffer_Binaural,
                                                           Cldfb_ImagBuffer_Binaural,
-                                                          (const int16_t) ( ( BINAURAL_MAXBANDS * hIvasRend->sampleRateOut ) / 48000 ),
+                                                          ( const int16_t )( ( BINAURAL_MAXBANDS * hIvasRend->sampleRateOut ) / 48000 ),
                                                           tmpBinaural,
                                                           1,
                                                           cldfb_in_flag,
-- 
GitLab


From bc892a1436e137b055e10bc9e81d73cab0133649 Mon Sep 17 00:00:00 2001
From: Jan Kiene <jan.kiene@iis.fraunhofer.de>
Date: Wed, 29 Oct 2025 18:47:02 +0100
Subject: [PATCH 09/12] align data type between field and function returns

---
 lib_rend/lib_rend.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/lib_rend/lib_rend.c b/lib_rend/lib_rend.c
index b910be38b..5d64c144d 100644
--- a/lib_rend/lib_rend.c
+++ b/lib_rend/lib_rend.c
@@ -103,7 +103,7 @@ typedef struct
     float gain; /* Linear, not in dB */
     rendering_context ctx;
     int32_t numNewSamplesPerChannel; /* Used to keep track how much new audio was fed before rendering current frame */
-    int32_t delayNumSamples;
+    int16_t delayNumSamples;
 } input_base;
 
 typedef struct
-- 
GitLab


From c27f49dee78e20c629460af30c0c512619046814 Mon Sep 17 00:00:00 2001
From: Jan Kiene <jan.kiene@iis.fraunhofer.de>
Date: Thu, 30 Oct 2025 14:53:35 +0100
Subject: [PATCH 10/12] change from 32bit to 16bit integer for
 num_samples_per_channel vars

---
 lib_rend/ivas_prot_rend.h      | 10 +++++-----
 lib_rend/ivas_td_ring_buffer.c | 22 ++++++++++------------
 lib_rend/lib_rend.c            |  8 ++++----
 3 files changed, 19 insertions(+), 21 deletions(-)

diff --git a/lib_rend/ivas_prot_rend.h b/lib_rend/ivas_prot_rend.h
index b00bfff2a..954baea3e 100644
--- a/lib_rend/ivas_prot_rend.h
+++ b/lib_rend/ivas_prot_rend.h
@@ -1599,7 +1599,7 @@ void ivas_rend_closeCldfbRend(
 
 ivas_error ivas_TD_RINGBUF_Open(
     TD_RINGBUF_HANDLE *ph,                                      /* i/o: Ring buffer handle                     */
-    const uint32_t capacity_per_channel,                        /* i  : Number of samples stored per channel   */
+    const uint16_t capacity_per_channel,                        /* i  : Number of samples stored per channel   */
     const uint16_t num_channels                                 /* i  : Number of channels                     */
 );
 
@@ -1610,21 +1610,21 @@ void ivas_TD_RINGBUF_Close(
 void ivas_TD_RINGBUF_Push( 
     TD_RINGBUF_HANDLE h,                                        /* i/o: Ring buffer handle                       */
     const float *data,                                          /* i  : Input data                               */
-    const uint32_t num_samples_per_channel                      /* i  : Number of samples per channel to store   */
+    const uint16_t num_samples_per_channel                      /* i  : Number of samples per channel to store   */
 );
 
 void ivas_TD_RINGBUF_PushZeros( 
     TD_RINGBUF_HANDLE h,                                        /* i/o: Ring buffer handle                      */
-    const uint32_t num_samples_per_channel                      /* i  : Number of zeros per channel to store    */
+    const uint16_t num_samples_per_channel                      /* i  : Number of zeros per channel to store    */
 );
 
 void ivas_TD_RINGBUF_Pop( 
     TD_RINGBUF_HANDLE h,                                        /* i/o: Ring buffer handle                      */
     float *data,                                                /* i  : Output data                             */
-    const uint32_t num_samples_per_channel                      /* i  : Number of samples per channel to retrieve*/
+    const uint16_t num_samples_per_channel                      /* i  : Number of samples per channel to retrieve*/
 );
 
-uint32_t ivas_TD_RINGBUF_Size(
+uint16_t ivas_TD_RINGBUF_Size(
     const TD_RINGBUF_HANDLE h                                   /* i  : Ring buffer handle                      */
 );
 
diff --git a/lib_rend/ivas_td_ring_buffer.c b/lib_rend/ivas_td_ring_buffer.c
index a580fe549..df60114ca 100644
--- a/lib_rend/ivas_td_ring_buffer.c
+++ b/lib_rend/ivas_td_ring_buffer.c
@@ -31,6 +31,7 @@
 *******************************************************************************************************/
 
 #include <assert.h>
+#include <stdint.h>
 #include <stdlib.h>
 #include "ivas_error_utils.h"
 #include "ivas_prot_rend.h"
@@ -87,7 +88,7 @@ static int16_t ivas_td_ringbuf_has_space_for_num_samples(
 
 ivas_error ivas_TD_RINGBUF_Open(
     TD_RINGBUF_HANDLE *ph,               /* i/o: Ring buffer handle                     */
-    const uint32_t capacity_per_channel, /* i  : Number of samples stored per channel   */
+    const uint16_t capacity_per_channel, /* i  : Number of samples stored per channel   */
     const uint16_t num_channels          /* i  : Number of channels                     */
 )
 {
@@ -166,11 +167,10 @@ void ivas_TD_RINGBUF_Close(
 void ivas_TD_RINGBUF_Push(
     TD_RINGBUF_HANDLE h,                   /* i/o: Ring buffer handle                       */
     const float *data,                     /* i  : Input data                               */
-    const uint32_t num_samples_per_channel /* i  : Number of samples per channel to store   */
+    const uint16_t num_samples_per_channel /* i  : Number of samples per channel to store   */
 )
 {
-    uint32_t s;
-    uint16_t c;
+    uint16_t c, s;
 
     assert( ivas_td_ringbuf_has_space_for_num_samples( h, num_samples_per_channel * h->num_channels ) );
 
@@ -205,11 +205,10 @@ void ivas_TD_RINGBUF_Push(
 
 void ivas_TD_RINGBUF_PushZeros(
     TD_RINGBUF_HANDLE h,                   /* i/o: Ring buffer handle                   */
-    const uint32_t num_samples_per_channel /* i  : Number of zeros per channel to store */
+    const uint16_t num_samples_per_channel /* i  : Number of zeros per channel to store */
 )
 {
-    uint32_t s;
-    uint16_t c;
+    uint16_t c, s;
 
     assert( ivas_td_ringbuf_has_space_for_num_samples( h, num_samples_per_channel * h->num_channels ) );
     if ( !num_samples_per_channel )
@@ -249,11 +248,10 @@ void ivas_TD_RINGBUF_PushZeros(
 void ivas_TD_RINGBUF_Pop(
     TD_RINGBUF_HANDLE h,                   /* i/o: Ring buffer handle                           */
     float *data,                           /* i  : Output data                                  */
-    const uint32_t num_samples_per_channel /* i  : Number of samples per channel to retrieve    */
+    const uint16_t num_samples_per_channel /* i  : Number of samples per channel to retrieve    */
 )
 {
-    uint32_t s;
-    uint16_t c;
+    uint16_t c, s;
 
     assert( ivas_td_ringbuf_total_size( h ) >= num_samples_per_channel * h->num_channels );
 
@@ -286,9 +284,9 @@ void ivas_TD_RINGBUF_Pop(
  * Returns number of buffered samples per channel.
  *---------------------------------------------------------------------*/
 
-uint32_t ivas_TD_RINGBUF_Size(
+uint16_t ivas_TD_RINGBUF_Size(
     const TD_RINGBUF_HANDLE h /* i  : Ring buffer handle */
 )
 {
-    return ivas_td_ringbuf_total_size( h ) / (uint32_t) h->num_channels;
+    return (uint16_t) ( ivas_td_ringbuf_total_size( h ) / (uint32_t) h->num_channels );
 }
diff --git a/lib_rend/lib_rend.c b/lib_rend/lib_rend.c
index 5d64c144d..b9f35e062 100644
--- a/lib_rend/lib_rend.c
+++ b/lib_rend/lib_rend.c
@@ -1480,9 +1480,9 @@ static ivas_error alignInputDelay(
 {
     ivas_error error;
     input_ism *inputIsm;
-    int16_t maxGlobalDelaySamples;
-    int32_t numSamplesToPush, numSamplesToPop;
-    uint32_t ringBufferSize, preDelay;
+    int16_t maxGlobalDelaySamples, numSamplesToPop, numSamplesToPush;
+    uint16_t ringBufferSize;
+    uint32_t preDelay;
 
     maxGlobalDelaySamples = latencyNsToSamples( sampleRateOut, maxGlobalDelayNs );
     maxGlobalDelaySamples *= cldfb2tdSampleFact;
@@ -1521,7 +1521,7 @@ static ivas_error alignInputDelay(
         /* push in the new input data and pop to retrieve a complete input frame
          * if we are flushing the inputs, we don't push in any new data */
         numSamplesToPush = flushInputs ? 0 : inputAudio.config.numSamplesPerChannel;
-        numSamplesToPop = flushInputs ? ivas_TD_RINGBUF_Size( inputBase->delayBuffer ) : (uint32_t) inputAudio.config.numSamplesPerChannel;
+        numSamplesToPop = flushInputs ? ivas_TD_RINGBUF_Size( inputBase->delayBuffer ) : inputAudio.config.numSamplesPerChannel;
 
         ivas_TD_RINGBUF_Push( inputBase->delayBuffer, inputAudio.data, numSamplesToPush );
         ivas_TD_RINGBUF_Pop( inputBase->delayBuffer, inputBase->inputBuffer.data, numSamplesToPop );
-- 
GitLab


From b30592e32554fd8a559b6ac4ef3af3bd738ab651 Mon Sep 17 00:00:00 2001
From: Jan Kiene <jan.kiene@iis.fraunhofer.de>
Date: Thu, 30 Oct 2025 15:03:55 +0100
Subject: [PATCH 11/12] some more data type related changes

---
 lib_rend/ivas_td_ring_buffer.c | 2 +-
 lib_rend/lib_rend.c            | 3 +--
 2 files changed, 2 insertions(+), 3 deletions(-)

diff --git a/lib_rend/ivas_td_ring_buffer.c b/lib_rend/ivas_td_ring_buffer.c
index df60114ca..c497bbf81 100644
--- a/lib_rend/ivas_td_ring_buffer.c
+++ b/lib_rend/ivas_td_ring_buffer.c
@@ -253,7 +253,7 @@ void ivas_TD_RINGBUF_Pop(
 {
     uint16_t c, s;
 
-    assert( ivas_td_ringbuf_total_size( h ) >= num_samples_per_channel * h->num_channels );
+    assert( ivas_td_ringbuf_total_size( h ) >= (uint32_t) ( num_samples_per_channel * h->num_channels ) );
 
     for ( s = 0; s < num_samples_per_channel; ++s )
     {
diff --git a/lib_rend/lib_rend.c b/lib_rend/lib_rend.c
index b9f35e062..949a329ab 100644
--- a/lib_rend/lib_rend.c
+++ b/lib_rend/lib_rend.c
@@ -1481,8 +1481,7 @@ static ivas_error alignInputDelay(
     ivas_error error;
     input_ism *inputIsm;
     int16_t maxGlobalDelaySamples, numSamplesToPop, numSamplesToPush;
-    uint16_t ringBufferSize;
-    uint32_t preDelay;
+    uint16_t ringBufferSize, preDelay;
 
     maxGlobalDelaySamples = latencyNsToSamples( sampleRateOut, maxGlobalDelayNs );
     maxGlobalDelaySamples *= cldfb2tdSampleFact;
-- 
GitLab


From a464d58a92ab59954ce29c5521cd4b38576fd665 Mon Sep 17 00:00:00 2001
From: Jan Kiene <jan.kiene@iis.fraunhofer.de>
Date: Thu, 30 Oct 2025 15:17:59 +0100
Subject: [PATCH 12/12] change casting order

---
 lib_rend/ivas_td_ring_buffer.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/lib_rend/ivas_td_ring_buffer.c b/lib_rend/ivas_td_ring_buffer.c
index c497bbf81..7f1ff0288 100644
--- a/lib_rend/ivas_td_ring_buffer.c
+++ b/lib_rend/ivas_td_ring_buffer.c
@@ -253,7 +253,7 @@ void ivas_TD_RINGBUF_Pop(
 {
     uint16_t c, s;
 
-    assert( ivas_td_ringbuf_total_size( h ) >= (uint32_t) ( num_samples_per_channel * h->num_channels ) );
+    assert( ivas_td_ringbuf_total_size( h ) >= num_samples_per_channel * (uint32_t) h->num_channels );
 
     for ( s = 0; s < num_samples_per_channel; ++s )
     {
-- 
GitLab