/**************************************************************
 *
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 *
 *************************************************************/



// MARKER(update_precomp.py): autogen include statement, do not remove
#include "precompiled_bridges.hxx"

#include <stdio.h>
#include <stdlib.h>
#include <hash_map>

#include <rtl/alloc.h>
#include <osl/mutex.hxx>

#include <com/sun/star/uno/genfunc.hxx>
#include "com/sun/star/uno/RuntimeException.hpp"
#include <uno/data.h>
#include <typelib/typedescription.hxx>

#include "bridges/cpp_uno/shared/bridge.hxx"
#include "bridges/cpp_uno/shared/cppinterfaceproxy.hxx"
#include "bridges/cpp_uno/shared/types.hxx"
#include "bridges/cpp_uno/shared/vtablefactory.hxx"

#include "abi.hxx"
#include "share.hxx"

using namespace ::osl;
using namespace ::rtl;
using namespace ::com::sun::star::uno;

//==================================================================================================

// Perform the UNO call
//
// We must convert the parameters stored in gpreg, fpreg and ovrflw to UNO
// arguments and call pThis->getUnoI()->pDispatcher.
//
// gpreg:  this, [gpr params x0..x7]   (the indirect-result ptr is x8, separate)
// fpreg:  [fpr params d0..d7]
// ovrflw: [gpr or fpr params (properly aligned)]
//
// On AArch64 a structure bigger than 16 bytes is returned via the buffer
// addressed by x8 (pIndirectReturn); 'this' is always x0 = gpreg[0].
// Simple types are returned in x0,x1 (int) or d0,d1 (fp); HFAs in d0..d3;
// non-HFA structures <= 16 bytes in x0,x1.
static typelib_TypeClass cpp2uno_call(
	bridges::cpp_uno::shared::CppInterfaceProxy * pThis,
	const typelib_TypeDescription * pMemberTypeDescr,
	typelib_TypeDescriptionReference * pReturnTypeRef, // 0 indicates void return
	sal_Int32 nParams, typelib_MethodParameter * pParams,
	void ** gpreg, void ** fpreg, void ** ovrflw,
	void * pIndirectReturn, // AArch64 x8 indirect-result pointer (0 if none)
	sal_uInt64 * pRegisterReturn /* space for register return */ )
{
	unsigned int nr_gpr = 0; //number of gpr registers used
	unsigned int nr_fpr = 0; //number of fpr registers used

	// return
	typelib_TypeDescription * pReturnTypeDescr = 0;
	if (pReturnTypeRef)
		TYPELIB_DANGER_GET( &pReturnTypeDescr, pReturnTypeRef );

	void * pUnoReturn = 0;
	void * pCppReturn = 0; // complex return ptr: if != 0 && != pUnoReturn, reconversion need

	if ( pReturnTypeDescr )
	{
		if ( aarch64::return_in_hidden_param( pReturnTypeRef ) )
		{
			// AArch64: the indirect-result pointer arrives in x8, NOT in the
			// first general-purpose argument register (unlike x86-64 SysV).
			// So we take it from pIndirectReturn and do NOT consume a gpreg
			// slot here; 'this' still occupies gpreg[0] below.
			pCppReturn = pIndirectReturn;

			pUnoReturn = ( bridges::cpp_uno::shared::relatesToInterfaceType( pReturnTypeDescr )
						   ? alloca( pReturnTypeDescr->nSize )
						   : pCppReturn ); // direct way
		}
		else
			pUnoReturn = pRegisterReturn; // direct way for simple types
	}

	// pop this (x0)
	gpreg++;
	nr_gpr++;

	// stack space
	// parameters
	void ** pUnoArgs = reinterpret_cast<void **>(alloca( 4 * sizeof(void *) * nParams ));
	void ** pCppArgs = pUnoArgs + nParams;
	// indizes of values this have to be converted (interface conversion cpp<=>uno)
	sal_Int32 * pTempIndizes = reinterpret_cast<sal_Int32 *>(pUnoArgs + (2 * nParams));
	// type descriptions for reconversions
	typelib_TypeDescription ** ppTempParamTypeDescr = reinterpret_cast<typelib_TypeDescription **>(pUnoArgs + (3 * nParams));

	sal_Int32 nTempIndizes = 0;

	for ( sal_Int32 nPos = 0; nPos < nParams; ++nPos )
	{
		const typelib_MethodParameter & rParam = pParams[nPos];

		int nUsedGPR = 0;
		int nUsedFPR = 0;
		bool bFitsRegisters = aarch64::examine_argument( rParam.pTypeRef, false, nUsedGPR, nUsedFPR );
		if ( !rParam.bOut && bridges::cpp_uno::shared::isSimpleType( rParam.pTypeRef ) ) // value
		{
			// A simple UNO type occupies exactly one register, GPR or FPR.
			OSL_ASSERT( bFitsRegisters && ( ( nUsedFPR == 1 && nUsedGPR == 0 ) || ( nUsedFPR == 0 && nUsedGPR == 1 ) ) );

			if ( nUsedFPR == 1 )
			{
				if ( nr_fpr < aarch64::MAX_FPR_REGS )
				{
					pCppArgs[nPos] = pUnoArgs[nPos] = fpreg++;
					nr_fpr++;
				}
				else
					pCppArgs[nPos] = pUnoArgs[nPos] = ovrflw++;
			}
			else if ( nUsedGPR == 1 )
			{
				if ( nr_gpr < aarch64::MAX_GPR_REGS )
				{
					pCppArgs[nPos] = pUnoArgs[nPos] = gpreg++;
					nr_gpr++;
				}
				else
					pCppArgs[nPos] = pUnoArgs[nPos] = ovrflw++;
			}
		}
		else // struct <= 16 bytes || ptr to complex value || ref
		{
			typelib_TypeDescription * pParamTypeDescr = 0;
			TYPELIB_DANGER_GET( &pParamTypeDescr, rParam.pTypeRef );

			void *pCppStack;
			if ( nr_gpr < aarch64::MAX_GPR_REGS )
			{
				pCppArgs[nPos] = pCppStack = *gpreg++;
				nr_gpr++;
			}
			else
				pCppArgs[nPos] = pCppStack = *ovrflw++;

			if (! rParam.bIn) // is pure out
			{
				// uno out is unconstructed mem!
				pUnoArgs[nPos] = alloca( pParamTypeDescr->nSize );
				pTempIndizes[nTempIndizes] = nPos;
				// will be released at reconversion
				ppTempParamTypeDescr[nTempIndizes++] = pParamTypeDescr;
			}
			else if ( bridges::cpp_uno::shared::relatesToInterfaceType( pParamTypeDescr ) ) // is in/inout
			{
				uno_copyAndConvertData( pUnoArgs[nPos] = alloca( pParamTypeDescr->nSize ),
										pCppStack, pParamTypeDescr,
										pThis->getBridge()->getCpp2Uno() );
				pTempIndizes[nTempIndizes] = nPos; // has to be reconverted
				// will be released at reconversion
				ppTempParamTypeDescr[nTempIndizes++] = pParamTypeDescr;
			}
			else // direct way
			{
				pUnoArgs[nPos] = pCppStack;
				// no longer needed
				TYPELIB_DANGER_RELEASE( pParamTypeDescr );
			}
		}
	}

	// ExceptionHolder
	uno_Any aUnoExc; // Any will be constructed by callee
	uno_Any * pUnoExc = &aUnoExc;

	// invoke uno dispatch call
	(*pThis->getUnoI()->pDispatcher)( pThis->getUnoI(), pMemberTypeDescr, pUnoReturn, pUnoArgs, &pUnoExc );

	// in case an exception occurred...
	if ( pUnoExc )
	{
		// destruct temporary in/inout params
		for ( ; nTempIndizes--; )
		{
			sal_Int32 nIndex = pTempIndizes[nTempIndizes];

			if (pParams[nIndex].bIn) // is in/inout => was constructed
				uno_destructData( pUnoArgs[nIndex], ppTempParamTypeDescr[nTempIndizes], 0 );
			TYPELIB_DANGER_RELEASE( ppTempParamTypeDescr[nTempIndizes] );
		}
		if (pReturnTypeDescr)
			TYPELIB_DANGER_RELEASE( pReturnTypeDescr );

		CPPU_CURRENT_NAMESPACE::raiseException( &aUnoExc, pThis->getBridge()->getUno2Cpp() ); // has to destruct the any
		// is here for dummy
		return typelib_TypeClass_VOID;
	}
	else // else no exception occurred...
	{
		// temporary params
		for ( ; nTempIndizes--; )
		{
			sal_Int32 nIndex = pTempIndizes[nTempIndizes];
			typelib_TypeDescription * pParamTypeDescr = ppTempParamTypeDescr[nTempIndizes];

			if ( pParams[nIndex].bOut ) // inout/out
			{
				// convert and assign
				uno_destructData( pCppArgs[nIndex], pParamTypeDescr, cpp_release );
				uno_copyAndConvertData( pCppArgs[nIndex], pUnoArgs[nIndex], pParamTypeDescr,
										pThis->getBridge()->getUno2Cpp() );
			}
			// destroy temp uno param
			uno_destructData( pUnoArgs[nIndex], pParamTypeDescr, 0 );

			TYPELIB_DANGER_RELEASE( pParamTypeDescr );
		}
		// return
		if ( pCppReturn ) // has complex return
		{
			if ( pUnoReturn != pCppReturn ) // needs reconversion
			{
				uno_copyAndConvertData( pCppReturn, pUnoReturn, pReturnTypeDescr,
										pThis->getBridge()->getUno2Cpp() );
				// destroy temp uno return
				uno_destructData( pUnoReturn, pReturnTypeDescr, 0 );
			}
			// complex return ptr is set to return reg
			*reinterpret_cast<void **>(pRegisterReturn) = pCppReturn;
		}
		if ( pReturnTypeDescr )
		{
			typelib_TypeClass eRet = (typelib_TypeClass)pReturnTypeDescr->eTypeClass;
			TYPELIB_DANGER_RELEASE( pReturnTypeDescr );
			return eRet;
		}
		else
			return typelib_TypeClass_VOID;
	}
}


//==================================================================================================
extern "C" typelib_TypeClass cpp_vtable_call(
	sal_Int32 nFunctionIndex, sal_Int32 nVtableOffset,
	void ** gpreg, void ** fpreg, void ** ovrflw,
	void * pIndirectReturn, // AArch64 x8 indirect-result pointer (0 if none)
	sal_uInt64 * pRegisterReturn /* space for register return */ )
{
	// gpreg:  this, [other gpr params x0..x7]
	// fpreg:  [fpr params d0..d7]
	// ovrflw: [gpr or fpr params (properly aligned)]
	// pIndirectReturn: x8 (the hidden return buffer), when bit 0x80000000 set.
	//
	// On AArch64 'this' is ALWAYS x0 = gpreg[0]; the hidden return pointer is
	// the separate x8 register, not a displaced first GPR (unlike x86-64 SysV
	// where it occupied gpreg[0] and 'this' moved to gpreg[1]).
	if ( nFunctionIndex & 0x80000000 )
		nFunctionIndex &= 0x7fffffff;

	void * pThis = gpreg[0];
	pThis = static_cast<char *>( pThis ) - nVtableOffset;

	bridges::cpp_uno::shared::CppInterfaceProxy * pCppI =
		bridges::cpp_uno::shared::CppInterfaceProxy::castInterfaceToProxy( pThis );

	typelib_InterfaceTypeDescription * pTypeDescr = pCppI->getTypeDescr();

	OSL_ENSURE( nFunctionIndex < pTypeDescr->nMapFunctionIndexToMemberIndex, "### illegal vtable index!\n" );
	if ( nFunctionIndex >= pTypeDescr->nMapFunctionIndexToMemberIndex )
	{
		throw RuntimeException( OUString::createFromAscii("illegal vtable index!"),
								reinterpret_cast<XInterface *>( pCppI ) );
	}

	// determine called method
	sal_Int32 nMemberPos = pTypeDescr->pMapFunctionIndexToMemberIndex[nFunctionIndex];
	OSL_ENSURE( nMemberPos < pTypeDescr->nAllMembers, "### illegal member index!\n" );

	TypeDescription aMemberDescr( pTypeDescr->ppAllMembers[nMemberPos] );

	typelib_TypeClass eRet;
	switch ( aMemberDescr.get()->eTypeClass )
	{
		case typelib_TypeClass_INTERFACE_ATTRIBUTE:
		{
			typelib_TypeDescriptionReference *pAttrTypeRef =
				reinterpret_cast<typelib_InterfaceAttributeTypeDescription *>( aMemberDescr.get() )->pAttributeTypeRef;

			if ( pTypeDescr->pMapMemberIndexToFunctionIndex[nMemberPos] == nFunctionIndex )
			{
				// is GET method
				eRet = cpp2uno_call( pCppI, aMemberDescr.get(), pAttrTypeRef,
						0, 0, // no params
						gpreg, fpreg, ovrflw, pIndirectReturn, pRegisterReturn );
			}
			else
			{
				// is SET method
				typelib_MethodParameter aParam;
				aParam.pTypeRef = pAttrTypeRef;
				aParam.bIn		= sal_True;
				aParam.bOut		= sal_False;

				eRet = cpp2uno_call( pCppI, aMemberDescr.get(),
						0, // indicates void return
						1, &aParam,
						gpreg, fpreg, ovrflw, pIndirectReturn, pRegisterReturn );
			}
			break;
		}
		case typelib_TypeClass_INTERFACE_METHOD:
		{
			// is METHOD
			switch ( nFunctionIndex )
			{
				case 1: // acquire()
					pCppI->acquireProxy(); // non virtual call!
					eRet = typelib_TypeClass_VOID;
					break;
				case 2: // release()
					pCppI->releaseProxy(); // non virtual call!
					eRet = typelib_TypeClass_VOID;
					break;
				case 0: // queryInterface() opt
				{
					// queryInterface([in] type) returns an Any (> 16 bytes),
					// so on AArch64 the result buffer is x8 (pIndirectReturn),
					// 'this' is gpreg[0], and the type argument is the first
					// real parameter, gpreg[1].
					typelib_TypeDescription * pTD = 0;
					TYPELIB_DANGER_GET( &pTD, reinterpret_cast<Type *>( gpreg[1] )->getTypeLibType() );
					if ( pTD )
					{
						XInterface * pInterface = 0;
						(*pCppI->getBridge()->getCppEnv()->getRegisteredInterface)
							( pCppI->getBridge()->getCppEnv(),
							  reinterpret_cast<void **>(&pInterface),
							  pCppI->getOid().pData,
							  reinterpret_cast<typelib_InterfaceTypeDescription *>( pTD ) );

						if ( pInterface )
						{
							::uno_any_construct( reinterpret_cast<uno_Any *>( pIndirectReturn ),
												 &pInterface, pTD, cpp_acquire );

							pInterface->release();
							TYPELIB_DANGER_RELEASE( pTD );

							reinterpret_cast<void **>( pRegisterReturn )[0] = pIndirectReturn;
							eRet = typelib_TypeClass_ANY;
							break;
						}
						TYPELIB_DANGER_RELEASE( pTD );
					}
				} // else perform queryInterface()
				default:
				{
					typelib_InterfaceMethodTypeDescription *pMethodTD =
						reinterpret_cast<typelib_InterfaceMethodTypeDescription *>( aMemberDescr.get() );

					eRet = cpp2uno_call( pCppI, aMemberDescr.get(),
										 pMethodTD->pReturnTypeRef,
										 pMethodTD->nParams,
										 pMethodTD->pParams,
										 gpreg, fpreg, ovrflw, pIndirectReturn, pRegisterReturn );
				}
			}
			break;
		}
		default:
		{
			throw RuntimeException( OUString::createFromAscii("no member description found!"),
									reinterpret_cast<XInterface *>( pCppI ) );
			// is here for dummy
			eRet = typelib_TypeClass_VOID;
		}
	}

	return eRet;
}

//==================================================================================================
// The incoming register-spill executor, implemented in call.s.  It is reached
// via BR from a per-slot snippet (codeSnippet below) with x16 carrying the
// packed (nVtableOffset << 32) | nFunctionIndex; it spills the argument
// registers and calls cpp_vtable_call.
extern "C" void privateSnippetExecutor( void );

// Each snippet is 5 AArch64 instructions (20 bytes) + 4 bytes padding to an
// 8-byte boundary + two 8-byte literals (the packed index and the executor
// address) = 40 bytes.
const int codeSnippetSize = 40;

// Generate a per-vtable-slot trampoline that loads the packed function index
// into x16 and branches to privateSnippetExecutor(), preserving every
// argument register.  Uses PC-relative literal loads because AArch64 cannot
// embed a 64-bit immediate in a single instruction.
//
// Layout (offsets in bytes from code):
//    0:  ldr  x16, #24      ; x16 = nOffsetAndIndex (literal at +24)
//    4:  ldr  x17, #28      ; x17 = privateSnippetExecutor (literal at +32)
//    8:  br   x17
//   12:  (unused / padding)
//   16:  (padding to 8-byte align the literals at 24)
//   24:  .quad nOffsetAndIndex
//   32:  .quad privateSnippetExecutor
//
// Note: the snippet creates no stack frame, so the C++ unwinder walks straight
// through it to the original caller (required for UNO exception propagation).
unsigned char * codeSnippet( unsigned char * code,
        sal_Int32 nFunctionIndex, sal_Int32 nVtableOffset,
        bool bHasHiddenParam ) SAL_THROW( () )
{
	sal_uInt64 nOffsetAndIndex = ( static_cast<sal_uInt64>( nVtableOffset ) << 32 ) | static_cast<sal_uInt64>( nFunctionIndex );

	if ( bHasHiddenParam )
		nOffsetAndIndex |= 0x80000000;

	sal_uInt32 * p = reinterpret_cast<sal_uInt32 *>( code );

	// ldr x16, #24  -> literal at code+24. imm19 = 24/4 = 6.
	//   encoding: 0x58000000 | (imm19 << 5) | Rt(16)
	p[0] = 0x58000000 | ( 6 << 5 ) | 16;
	// ldr x17, #28  -> literal at code+32 (relative to this insn at +4): 28.
	//   imm19 = 28/4 = 7.
	p[1] = 0x58000000 | ( 7 << 5 ) | 17;
	// br x17  -> 0xD61F0000 | (Rn(17) << 5)
	p[2] = 0xD61F0000 | ( 17 << 5 );
	// p[3] (offset 12) and p[4] (offset 16..20) are padding.
	p[3] = 0xD503201F; // NOP
	p[4] = 0xD503201F; // NOP

	// literals, 8-byte aligned at offset 24 and 32
	*reinterpret_cast<sal_uInt64 *>( code + 24 ) = nOffsetAndIndex;
	*reinterpret_cast<sal_uInt64 *>( code + 32 ) = reinterpret_cast<sal_uInt64>( privateSnippetExecutor );

	return code + codeSnippetSize;
}

//==================================================================================================
struct bridges::cpp_uno::shared::VtableFactory::Slot { void * fn; };

bridges::cpp_uno::shared::VtableFactory::Slot *
bridges::cpp_uno::shared::VtableFactory::mapBlockToVtable(void * block)
{
    return static_cast< Slot * >(block) + 2;
}

//==================================================================================================
sal_Size bridges::cpp_uno::shared::VtableFactory::getBlockSize(
    sal_Int32 slotCount)
{
    return (slotCount + 2) * sizeof (Slot) + slotCount * codeSnippetSize;
}

//==================================================================================================
bridges::cpp_uno::shared::VtableFactory::Slot *
bridges::cpp_uno::shared::VtableFactory::initializeBlock(
    void * block, sal_Int32 slotCount)
{
    Slot * slots = mapBlockToVtable(block);
    slots[-2].fn = 0;
    slots[-1].fn = 0;
    return slots + slotCount;
}

//==================================================================================================

unsigned char * bridges::cpp_uno::shared::VtableFactory::addLocalFunctions(
	Slot ** slots, unsigned char * code, /*sal_PtrDiff writetoexecdiff,*/
	typelib_InterfaceTypeDescription const * type, sal_Int32 nFunctionOffset,
	sal_Int32 functionCount, sal_Int32 nVtableOffset )
{
	const sal_PtrDiff writetoexecdiff = 0;
	(*slots) -= functionCount;
	Slot * s = *slots;
	for ( sal_Int32 nPos = 0; nPos < type->nMembers; ++nPos )
	{
		typelib_TypeDescription * pTD = 0;

		TYPELIB_DANGER_GET( &pTD, type->ppMembers[ nPos ] );
		OSL_ASSERT( pTD );

		if ( typelib_TypeClass_INTERFACE_ATTRIBUTE == pTD->eTypeClass )
		{
			typelib_InterfaceAttributeTypeDescription *pAttrTD =
				reinterpret_cast<typelib_InterfaceAttributeTypeDescription *>( pTD );

			// get method
			(s++)->fn = code + writetoexecdiff;
			code = codeSnippet( code, nFunctionOffset++, nVtableOffset,
								aarch64::return_in_hidden_param( pAttrTD->pAttributeTypeRef ) );

			if ( ! pAttrTD->bReadOnly )
			{
				// set method
				(s++)->fn = code + writetoexecdiff;
				code = codeSnippet( code, nFunctionOffset++, nVtableOffset, false );
			}
		}
		else if ( typelib_TypeClass_INTERFACE_METHOD == pTD->eTypeClass )
		{
			typelib_InterfaceMethodTypeDescription *pMethodTD =
				reinterpret_cast<typelib_InterfaceMethodTypeDescription *>( pTD );

			(s++)->fn = code + writetoexecdiff;
			code = codeSnippet( code, nFunctionOffset++, nVtableOffset,
								aarch64::return_in_hidden_param( pMethodTD->pReturnTypeRef ) );
		}
		else
			OSL_ASSERT( false );

		TYPELIB_DANGER_RELEASE( pTD );
	}
	return code;
}

//==================================================================================================
void bridges::cpp_uno::shared::VtableFactory::flushCode(
	unsigned char const *, unsigned char const * )
{
}
