mirror of
				https://gitlab.freedesktop.org/pipewire/pipewire.git
				synced 2025-11-03 09:01:54 -05:00 
			
		
		
		
	channelmix: read mix coefficients correctly
Fix 5p1 to stereo mixdown by reading the coefficients correctly. Align 5p1 to quad SSE and C implementation Fixes #272
This commit is contained in:
		
							parent
							
								
									613824ab0b
								
							
						
					
					
						commit
						4867edb947
					
				
					 2 changed files with 18 additions and 16 deletions
				
			
		| 
						 | 
					@ -295,10 +295,10 @@ channelmix_f32_5p1_2_c(struct channelmix *mix, uint32_t n_dst, void * SPA_RESTRI
 | 
				
			||||||
	const float **s = (const float **) src;
 | 
						const float **s = (const float **) src;
 | 
				
			||||||
	const float v0 = mix->matrix[0][0];
 | 
						const float v0 = mix->matrix[0][0];
 | 
				
			||||||
	const float v1 = mix->matrix[1][1];
 | 
						const float v1 = mix->matrix[1][1];
 | 
				
			||||||
	const float clev = mix->matrix[2][0];
 | 
						const float clev = (mix->matrix[0][2] + mix->matrix[1][2]) * 0.5f;
 | 
				
			||||||
	const float llev = mix->matrix[3][0];
 | 
						const float llev = (mix->matrix[0][3] + mix->matrix[1][3]) * 0.5f;
 | 
				
			||||||
	const float slev0 = mix->matrix[4][0];
 | 
						const float slev0 = mix->matrix[0][4];
 | 
				
			||||||
	const float slev1 = mix->matrix[4][1];
 | 
						const float slev1 = mix->matrix[1][5];
 | 
				
			||||||
 | 
					
 | 
				
			||||||
	if (mix->zero) {
 | 
						if (mix->zero) {
 | 
				
			||||||
		memset(d[0], 0, n_samples * sizeof(float));
 | 
							memset(d[0], 0, n_samples * sizeof(float));
 | 
				
			||||||
| 
						 | 
					@ -350,8 +350,8 @@ channelmix_f32_5p1_4_c(struct channelmix *mix, uint32_t n_dst, void * SPA_RESTRI
 | 
				
			||||||
	uint32_t i, n;
 | 
						uint32_t i, n;
 | 
				
			||||||
	float **d = (float **) dst;
 | 
						float **d = (float **) dst;
 | 
				
			||||||
	const float **s = (const float **) src;
 | 
						const float **s = (const float **) src;
 | 
				
			||||||
	const float clev = mix->matrix[2][0];
 | 
						const float clev = mix->matrix[0][2];
 | 
				
			||||||
	const float llev = mix->matrix[3][0];
 | 
						const float llev = mix->matrix[0][3];
 | 
				
			||||||
	const float v0 = mix->matrix[0][0];
 | 
						const float v0 = mix->matrix[0][0];
 | 
				
			||||||
	const float v1 = mix->matrix[1][1];
 | 
						const float v1 = mix->matrix[1][1];
 | 
				
			||||||
	const float v4 = mix->matrix[2][4];
 | 
						const float v4 = mix->matrix[2][4];
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
| 
						 | 
					@ -145,10 +145,10 @@ channelmix_f32_5p1_2_sse(struct channelmix *mix, uint32_t n_dst, void * SPA_REST
 | 
				
			||||||
	const float **s = (const float **) src;
 | 
						const float **s = (const float **) src;
 | 
				
			||||||
	const __m128 v0 = _mm_set1_ps(mix->matrix[0][0]);
 | 
						const __m128 v0 = _mm_set1_ps(mix->matrix[0][0]);
 | 
				
			||||||
	const __m128 v1 = _mm_set1_ps(mix->matrix[1][1]);
 | 
						const __m128 v1 = _mm_set1_ps(mix->matrix[1][1]);
 | 
				
			||||||
	const __m128 clev = _mm_set1_ps(mix->matrix[2][0]);
 | 
						const __m128 clev = _mm_set1_ps((mix->matrix[0][2] + mix->matrix[1][2]) * 0.5f);
 | 
				
			||||||
	const __m128 llev = _mm_set1_ps(mix->matrix[3][0]);
 | 
						const __m128 llev = _mm_set1_ps((mix->matrix[0][3] + mix->matrix[1][3]) * 0.5f);
 | 
				
			||||||
	const __m128 slev0 = _mm_set1_ps(mix->matrix[4][0]);
 | 
						const __m128 slev0 = _mm_set1_ps(mix->matrix[0][4]);
 | 
				
			||||||
	const __m128 slev1 = _mm_set1_ps(mix->matrix[4][1]);
 | 
						const __m128 slev1 = _mm_set1_ps(mix->matrix[1][5]);
 | 
				
			||||||
	__m128 in, ctr;
 | 
						__m128 in, ctr;
 | 
				
			||||||
	const float *sFL = s[0], *sFR = s[1], *sFC = s[2], *sLFE = s[3], *sSL = s[4], *sSR = s[5];
 | 
						const float *sFL = s[0], *sFR = s[1], *sFC = s[2], *sLFE = s[3], *sSL = s[4], *sSR = s[5];
 | 
				
			||||||
	float *dFL = d[0], *dFR = d[1];
 | 
						float *dFL = d[0], *dFR = d[1];
 | 
				
			||||||
| 
						 | 
					@ -313,10 +313,12 @@ channelmix_f32_5p1_4_sse(struct channelmix *mix, uint32_t n_dst, void * SPA_REST
 | 
				
			||||||
	uint32_t i, n, unrolled;
 | 
						uint32_t i, n, unrolled;
 | 
				
			||||||
	float **d = (float **) dst;
 | 
						float **d = (float **) dst;
 | 
				
			||||||
	const float **s = (const float **) src;
 | 
						const float **s = (const float **) src;
 | 
				
			||||||
	const __m128 clev = _mm_set1_ps(mix->matrix[2][2]);
 | 
						const __m128 clev = _mm_set1_ps(mix->matrix[0][2]);
 | 
				
			||||||
	const __m128 llev = _mm_set1_ps(mix->matrix[3][3]);
 | 
						const __m128 llev = _mm_set1_ps(mix->matrix[0][3]);
 | 
				
			||||||
	const __m128 v0 = _mm_set1_ps(mix->matrix[0][0]);
 | 
						const __m128 v0 = _mm_set1_ps(mix->matrix[0][0]);
 | 
				
			||||||
	const __m128 v1 = _mm_set1_ps(mix->matrix[1][1]);
 | 
						const __m128 v1 = _mm_set1_ps(mix->matrix[1][1]);
 | 
				
			||||||
 | 
						const __m128 v4 = _mm_set1_ps(mix->matrix[2][4]);
 | 
				
			||||||
 | 
						const __m128 v5 = _mm_set1_ps(mix->matrix[3][5]);
 | 
				
			||||||
	__m128 ctr;
 | 
						__m128 ctr;
 | 
				
			||||||
	const float *sFL = s[0], *sFR = s[1], *sFC = s[2], *sLFE = s[3], *sSL = s[4], *sSR = s[5];
 | 
						const float *sFL = s[0], *sFR = s[1], *sFC = s[2], *sLFE = s[3], *sSL = s[4], *sSR = s[5];
 | 
				
			||||||
	float *dFL = d[0], *dFR = d[1], *dRL = d[2], *dRR = d[3];
 | 
						float *dFL = d[0], *dFR = d[1], *dRL = d[2], *dRR = d[3];
 | 
				
			||||||
| 
						 | 
					@ -363,16 +365,16 @@ channelmix_f32_5p1_4_sse(struct channelmix *mix, uint32_t n_dst, void * SPA_REST
 | 
				
			||||||
			ctr = _mm_add_ps(ctr, _mm_mul_ps(_mm_load_ps(&sLFE[n]), llev));
 | 
								ctr = _mm_add_ps(ctr, _mm_mul_ps(_mm_load_ps(&sLFE[n]), llev));
 | 
				
			||||||
			_mm_store_ps(&dFL[n], _mm_mul_ps(_mm_add_ps(_mm_load_ps(&sFL[n]), ctr), v0));
 | 
								_mm_store_ps(&dFL[n], _mm_mul_ps(_mm_add_ps(_mm_load_ps(&sFL[n]), ctr), v0));
 | 
				
			||||||
			_mm_store_ps(&dFR[n], _mm_mul_ps(_mm_add_ps(_mm_load_ps(&sFR[n]), ctr), v1));
 | 
								_mm_store_ps(&dFR[n], _mm_mul_ps(_mm_add_ps(_mm_load_ps(&sFR[n]), ctr), v1));
 | 
				
			||||||
			_mm_store_ps(&dRL[n], _mm_mul_ps(_mm_load_ps(&sSL[n]), v0));
 | 
								_mm_store_ps(&dRL[n], _mm_mul_ps(_mm_load_ps(&sSL[n]), v4));
 | 
				
			||||||
			_mm_store_ps(&dRR[n], _mm_mul_ps(_mm_load_ps(&sSR[n]), v1));
 | 
								_mm_store_ps(&dRR[n], _mm_mul_ps(_mm_load_ps(&sSR[n]), v5));
 | 
				
			||||||
		}
 | 
							}
 | 
				
			||||||
		for(; n < n_samples; n++) {
 | 
							for(; n < n_samples; n++) {
 | 
				
			||||||
			ctr = _mm_mul_ss(_mm_load_ss(&sFC[n]), clev);
 | 
								ctr = _mm_mul_ss(_mm_load_ss(&sFC[n]), clev);
 | 
				
			||||||
			ctr = _mm_add_ss(ctr, _mm_mul_ss(_mm_load_ss(&sLFE[n]), llev));
 | 
								ctr = _mm_add_ss(ctr, _mm_mul_ss(_mm_load_ss(&sLFE[n]), llev));
 | 
				
			||||||
			_mm_store_ss(&dFL[n], _mm_mul_ss(_mm_add_ss(_mm_load_ss(&sFL[n]), ctr), v0));
 | 
								_mm_store_ss(&dFL[n], _mm_mul_ss(_mm_add_ss(_mm_load_ss(&sFL[n]), ctr), v0));
 | 
				
			||||||
			_mm_store_ss(&dFR[n], _mm_mul_ss(_mm_add_ss(_mm_load_ss(&sFR[n]), ctr), v1));
 | 
								_mm_store_ss(&dFR[n], _mm_mul_ss(_mm_add_ss(_mm_load_ss(&sFR[n]), ctr), v1));
 | 
				
			||||||
			_mm_store_ss(&dRL[n], _mm_mul_ss(_mm_load_ss(&sSL[n]), v0));
 | 
								_mm_store_ss(&dRL[n], _mm_mul_ss(_mm_load_ss(&sSL[n]), v4));
 | 
				
			||||||
			_mm_store_ss(&dRR[n], _mm_mul_ss(_mm_load_ss(&sSR[n]), v1));
 | 
								_mm_store_ss(&dRR[n], _mm_mul_ss(_mm_load_ss(&sSR[n]), v5));
 | 
				
			||||||
		}
 | 
							}
 | 
				
			||||||
	}
 | 
						}
 | 
				
			||||||
}
 | 
					}
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue