diff --git a/codegen/annotations.h b/codegen/annotations.h index ec01285..af503c9 100644 --- a/codegen/annotations.h +++ b/codegen/annotations.h @@ -5536,13 +5536,13 @@ cudaError_t cudaMemcpyFromSymbolAsync(void *dst, const void *symbol, enum cudaMemcpyKind kind, cudaStream_t stream); /** - * @param devPtr SEND_RECV + * @param devPtr SEND_ONLY * @param value SEND_ONLY * @param count SEND_ONLY */ cudaError_t cudaMemset(void *devPtr, int value, size_t count); /** - * @param devPtr SEND_RECV + * @param devPtr SEND_ONLY * @param pitch SEND_ONLY * @param value SEND_ONLY * @param width SEND_ONLY @@ -5558,7 +5558,7 @@ cudaError_t cudaMemset2D(void *devPtr, size_t pitch, int value, size_t width, cudaError_t cudaMemset3D(struct cudaPitchedPtr pitchedDevPtr, int value, struct cudaExtent extent); /** - * @param devPtr SEND_RECV + * @param devPtr SEND_ONLY * @param value SEND_ONLY * @param count SEND_ONLY * @param stream SEND_ONLY @@ -5566,7 +5566,7 @@ cudaError_t cudaMemset3D(struct cudaPitchedPtr pitchedDevPtr, int value, cudaError_t cudaMemsetAsync(void *devPtr, int value, size_t count, cudaStream_t stream); /** - * @param devPtr SEND_RECV + * @param devPtr SEND_ONLY * @param pitch SEND_ONLY * @param value SEND_ONLY * @param width SEND_ONLY diff --git a/codegen/gen_api.h b/codegen/gen_api.h index 2545cf2..08901ce 100644 --- a/codegen/gen_api.h +++ b/codegen/gen_api.h @@ -768,644 +768,648 @@ #define RPC_cudaMemcpyAsync 767 #define RPC_cudaMemcpy2DToArrayAsync 768 #define RPC_cudaMemcpyToSymbolAsync 769 -#define RPC_cudaMemset3D 770 -#define RPC_cudaMemset3DAsync 771 -#define RPC_cudaGetSymbolAddress 772 -#define RPC_cudaGetSymbolSize 773 -#define RPC_cudaMemPrefetchAsync 774 -#define RPC_cudaMemAdvise 775 -#define RPC_cudaMemRangeGetAttributes 776 -#define RPC_cudaMemcpyToArray 777 -#define RPC_cudaMemcpyArrayToArray 778 -#define RPC_cudaMemcpyToArrayAsync 779 -#define RPC_cudaMallocAsync 780 -#define RPC_cudaMemPoolTrimTo 781 -#define RPC_cudaMemPoolSetAccess 782 -#define RPC_cudaMemPoolGetAccess 783 -#define RPC_cudaMemPoolCreate 784 -#define RPC_cudaMemPoolDestroy 785 -#define RPC_cudaMallocFromPoolAsync 786 -#define RPC_cudaMemPoolImportPointer 787 -#define RPC_cudaPointerGetAttributes 788 -#define RPC_cudaDeviceCanAccessPeer 789 -#define RPC_cudaDeviceEnablePeerAccess 790 -#define RPC_cudaDeviceDisablePeerAccess 791 -#define RPC_cudaGraphicsUnregisterResource 792 -#define RPC_cudaGraphicsResourceSetMapFlags 793 -#define RPC_cudaGraphicsMapResources 794 -#define RPC_cudaGraphicsUnmapResources 795 -#define RPC_cudaGraphicsResourceGetMappedPointer 796 -#define RPC_cudaGraphicsSubResourceGetMappedArray 797 -#define RPC_cudaGraphicsResourceGetMappedMipmappedArray 798 -#define RPC_cudaGetChannelDesc 799 -#define RPC_cudaCreateChannelDesc 800 -#define RPC_cudaCreateTextureObject 801 -#define RPC_cudaDestroyTextureObject 802 -#define RPC_cudaGetTextureObjectResourceDesc 803 -#define RPC_cudaGetTextureObjectTextureDesc 804 -#define RPC_cudaGetTextureObjectResourceViewDesc 805 -#define RPC_cudaCreateSurfaceObject 806 -#define RPC_cudaDestroySurfaceObject 807 -#define RPC_cudaGetSurfaceObjectResourceDesc 808 -#define RPC_cudaDriverGetVersion 809 -#define RPC_cudaRuntimeGetVersion 810 -#define RPC_cudaGraphCreate 811 -#define RPC_cudaGraphAddKernelNode 812 -#define RPC_cudaGraphKernelNodeGetParams 813 -#define RPC_cudaGraphKernelNodeSetParams 814 -#define RPC_cudaGraphKernelNodeCopyAttributes 815 -#define RPC_cudaGraphKernelNodeGetAttribute 816 -#define RPC_cudaGraphKernelNodeSetAttribute 817 -#define RPC_cudaGraphAddMemcpyNode 818 -#define RPC_cudaGraphAddMemcpyNodeToSymbol 819 -#define RPC_cudaGraphMemcpyNodeGetParams 820 -#define RPC_cudaGraphMemcpyNodeSetParams 821 -#define RPC_cudaGraphMemcpyNodeSetParamsToSymbol 822 -#define RPC_cudaGraphAddMemsetNode 823 -#define RPC_cudaGraphMemsetNodeGetParams 824 -#define RPC_cudaGraphMemsetNodeSetParams 825 -#define RPC_cudaGraphAddHostNode 826 -#define RPC_cudaGraphHostNodeGetParams 827 -#define RPC_cudaGraphHostNodeSetParams 828 -#define RPC_cudaGraphAddChildGraphNode 829 -#define RPC_cudaGraphChildGraphNodeGetGraph 830 -#define RPC_cudaGraphAddEmptyNode 831 -#define RPC_cudaGraphAddEventRecordNode 832 -#define RPC_cudaGraphEventRecordNodeGetEvent 833 -#define RPC_cudaGraphEventRecordNodeSetEvent 834 -#define RPC_cudaGraphAddEventWaitNode 835 -#define RPC_cudaGraphEventWaitNodeGetEvent 836 -#define RPC_cudaGraphEventWaitNodeSetEvent 837 -#define RPC_cudaGraphAddExternalSemaphoresSignalNode 838 -#define RPC_cudaGraphExternalSemaphoresSignalNodeGetParams 839 -#define RPC_cudaGraphExternalSemaphoresSignalNodeSetParams 840 -#define RPC_cudaGraphAddExternalSemaphoresWaitNode 841 -#define RPC_cudaGraphExternalSemaphoresWaitNodeGetParams 842 -#define RPC_cudaGraphExternalSemaphoresWaitNodeSetParams 843 -#define RPC_cudaGraphAddMemAllocNode 844 -#define RPC_cudaGraphMemAllocNodeGetParams 845 -#define RPC_cudaDeviceGraphMemTrim 846 -#define RPC_cudaGraphClone 847 -#define RPC_cudaGraphNodeFindInClone 848 -#define RPC_cudaGraphNodeGetType 849 -#define RPC_cudaGraphGetNodes 850 -#define RPC_cudaGraphGetRootNodes 851 -#define RPC_cudaGraphGetEdges 852 -#define RPC_cudaGraphNodeGetDependencies 853 -#define RPC_cudaGraphNodeGetDependentNodes 854 -#define RPC_cudaGraphAddDependencies 855 -#define RPC_cudaGraphRemoveDependencies 856 -#define RPC_cudaGraphDestroyNode 857 -#define RPC_cudaGraphInstantiate 858 -#define RPC_cudaGraphInstantiateWithFlags 859 -#define RPC_cudaGraphInstantiateWithParams 860 -#define RPC_cudaGraphExecGetFlags 861 -#define RPC_cudaGraphExecKernelNodeSetParams 862 -#define RPC_cudaGraphExecMemcpyNodeSetParams 863 -#define RPC_cudaGraphExecMemcpyNodeSetParamsToSymbol 864 -#define RPC_cudaGraphExecMemsetNodeSetParams 865 -#define RPC_cudaGraphExecHostNodeSetParams 866 -#define RPC_cudaGraphExecChildGraphNodeSetParams 867 -#define RPC_cudaGraphExecEventRecordNodeSetEvent 868 -#define RPC_cudaGraphExecEventWaitNodeSetEvent 869 -#define RPC_cudaGraphExecExternalSemaphoresSignalNodeSetParams 870 -#define RPC_cudaGraphExecExternalSemaphoresWaitNodeSetParams 871 -#define RPC_cudaGraphNodeSetEnabled 872 -#define RPC_cudaGraphNodeGetEnabled 873 -#define RPC_cudaGraphExecUpdate 874 -#define RPC_cudaGraphUpload 875 -#define RPC_cudaGraphLaunch 876 -#define RPC_cudaGraphExecDestroy 877 -#define RPC_cudaGraphDestroy 878 -#define RPC_cudaGraphDebugDotPrint 879 -#define RPC_cudaUserObjectRetain 880 -#define RPC_cudaUserObjectRelease 881 -#define RPC_cudaGraphRetainUserObject 882 -#define RPC_cudaGraphReleaseUserObject 883 -#define RPC_cudaGetDriverEntryPoint 884 -#define RPC_cudaGetExportTable 885 -#define RPC_cudaGetFuncBySymbol 886 -#define RPC_cublasCreate_v2 887 -#define RPC_cublasDestroy_v2 888 -#define RPC_cublasGetVersion_v2 889 -#define RPC_cublasGetProperty 890 -#define RPC_cublasGetCudartVersion 891 -#define RPC_cublasSetStream_v2 892 -#define RPC_cublasGetStream_v2 893 -#define RPC_cublasGetPointerMode_v2 894 -#define RPC_cublasSetPointerMode_v2 895 -#define RPC_cublasGetAtomicsMode 896 -#define RPC_cublasSetAtomicsMode 897 -#define RPC_cublasGetMathMode 898 -#define RPC_cublasSetMathMode 899 -#define RPC_cublasGetSmCountTarget 900 -#define RPC_cublasSetSmCountTarget 901 -#define RPC_cublasGetStatusName 902 -#define RPC_cublasGetStatusString 903 -#define RPC_cublasLoggerConfigure 904 -#define RPC_cublasSetLoggerCallback 905 -#define RPC_cublasGetLoggerCallback 906 -#define RPC_cublasXerbla 907 -#define RPC_cublasSnrm2_v2 908 -#define RPC_cublasSnrm2_v2_64 909 -#define RPC_cublasDnrm2_v2 910 -#define RPC_cublasDnrm2_v2_64 911 -#define RPC_cublasScnrm2_v2 912 -#define RPC_cublasScnrm2_v2_64 913 -#define RPC_cublasDznrm2_v2 914 -#define RPC_cublasDznrm2_v2_64 915 -#define RPC_cublasSdot_v2 916 -#define RPC_cublasSdot_v2_64 917 -#define RPC_cublasDdot_v2 918 -#define RPC_cublasDdot_v2_64 919 -#define RPC_cublasCdotu_v2 920 -#define RPC_cublasCdotu_v2_64 921 -#define RPC_cublasCdotc_v2 922 -#define RPC_cublasCdotc_v2_64 923 -#define RPC_cublasZdotu_v2 924 -#define RPC_cublasZdotu_v2_64 925 -#define RPC_cublasZdotc_v2 926 -#define RPC_cublasZdotc_v2_64 927 -#define RPC_cublasSscal_v2 928 -#define RPC_cublasSscal_v2_64 929 -#define RPC_cublasDscal_v2 930 -#define RPC_cublasDscal_v2_64 931 -#define RPC_cublasCscal_v2 932 -#define RPC_cublasCscal_v2_64 933 -#define RPC_cublasCsscal_v2 934 -#define RPC_cublasCsscal_v2_64 935 -#define RPC_cublasZscal_v2 936 -#define RPC_cublasZscal_v2_64 937 -#define RPC_cublasZdscal_v2 938 -#define RPC_cublasZdscal_v2_64 939 -#define RPC_cublasSaxpy_v2 940 -#define RPC_cublasSaxpy_v2_64 941 -#define RPC_cublasDaxpy_v2 942 -#define RPC_cublasDaxpy_v2_64 943 -#define RPC_cublasCaxpy_v2 944 -#define RPC_cublasCaxpy_v2_64 945 -#define RPC_cublasZaxpy_v2 946 -#define RPC_cublasZaxpy_v2_64 947 -#define RPC_cublasScopy_v2 948 -#define RPC_cublasScopy_v2_64 949 -#define RPC_cublasDcopy_v2 950 -#define RPC_cublasDcopy_v2_64 951 -#define RPC_cublasCcopy_v2 952 -#define RPC_cublasCcopy_v2_64 953 -#define RPC_cublasZcopy_v2 954 -#define RPC_cublasZcopy_v2_64 955 -#define RPC_cublasSswap_v2 956 -#define RPC_cublasSswap_v2_64 957 -#define RPC_cublasDswap_v2 958 -#define RPC_cublasDswap_v2_64 959 -#define RPC_cublasCswap_v2 960 -#define RPC_cublasCswap_v2_64 961 -#define RPC_cublasZswap_v2 962 -#define RPC_cublasZswap_v2_64 963 -#define RPC_cublasIsamax_v2 964 -#define RPC_cublasIsamax_v2_64 965 -#define RPC_cublasIdamax_v2 966 -#define RPC_cublasIdamax_v2_64 967 -#define RPC_cublasIcamax_v2 968 -#define RPC_cublasIcamax_v2_64 969 -#define RPC_cublasIzamax_v2 970 -#define RPC_cublasIzamax_v2_64 971 -#define RPC_cublasIamaxEx 972 -#define RPC_cublasIamaxEx_64 973 -#define RPC_cublasIsamin_v2 974 -#define RPC_cublasIsamin_v2_64 975 -#define RPC_cublasIdamin_v2 976 -#define RPC_cublasIdamin_v2_64 977 -#define RPC_cublasIcamin_v2 978 -#define RPC_cublasIcamin_v2_64 979 -#define RPC_cublasIzamin_v2 980 -#define RPC_cublasIzamin_v2_64 981 -#define RPC_cublasIaminEx 982 -#define RPC_cublasIaminEx_64 983 -#define RPC_cublasSasum_v2 984 -#define RPC_cublasSasum_v2_64 985 -#define RPC_cublasDasum_v2 986 -#define RPC_cublasDasum_v2_64 987 -#define RPC_cublasScasum_v2 988 -#define RPC_cublasScasum_v2_64 989 -#define RPC_cublasDzasum_v2 990 -#define RPC_cublasDzasum_v2_64 991 -#define RPC_cublasSrot_v2 992 -#define RPC_cublasSrot_v2_64 993 -#define RPC_cublasDrot_v2 994 -#define RPC_cublasDrot_v2_64 995 -#define RPC_cublasCrot_v2 996 -#define RPC_cublasCrot_v2_64 997 -#define RPC_cublasCsrot_v2 998 -#define RPC_cublasCsrot_v2_64 999 -#define RPC_cublasZrot_v2 1000 -#define RPC_cublasZrot_v2_64 1001 -#define RPC_cublasZdrot_v2 1002 -#define RPC_cublasZdrot_v2_64 1003 -#define RPC_cublasSrotg_v2 1004 -#define RPC_cublasDrotg_v2 1005 -#define RPC_cublasCrotg_v2 1006 -#define RPC_cublasZrotg_v2 1007 -#define RPC_cublasSrotm_v2 1008 -#define RPC_cublasSrotm_v2_64 1009 -#define RPC_cublasDrotm_v2 1010 -#define RPC_cublasDrotm_v2_64 1011 -#define RPC_cublasSrotmg_v2 1012 -#define RPC_cublasDrotmg_v2 1013 -#define RPC_cublasSgemv_v2 1014 -#define RPC_cublasSgemv_v2_64 1015 -#define RPC_cublasDgemv_v2 1016 -#define RPC_cublasDgemv_v2_64 1017 -#define RPC_cublasCgemv_v2 1018 -#define RPC_cublasCgemv_v2_64 1019 -#define RPC_cublasZgemv_v2 1020 -#define RPC_cublasZgemv_v2_64 1021 -#define RPC_cublasSgbmv_v2 1022 -#define RPC_cublasSgbmv_v2_64 1023 -#define RPC_cublasDgbmv_v2 1024 -#define RPC_cublasDgbmv_v2_64 1025 -#define RPC_cublasCgbmv_v2 1026 -#define RPC_cublasCgbmv_v2_64 1027 -#define RPC_cublasZgbmv_v2 1028 -#define RPC_cublasZgbmv_v2_64 1029 -#define RPC_cublasStrmv_v2 1030 -#define RPC_cublasStrmv_v2_64 1031 -#define RPC_cublasDtrmv_v2 1032 -#define RPC_cublasDtrmv_v2_64 1033 -#define RPC_cublasCtrmv_v2 1034 -#define RPC_cublasCtrmv_v2_64 1035 -#define RPC_cublasZtrmv_v2 1036 -#define RPC_cublasZtrmv_v2_64 1037 -#define RPC_cublasStbmv_v2 1038 -#define RPC_cublasStbmv_v2_64 1039 -#define RPC_cublasDtbmv_v2 1040 -#define RPC_cublasDtbmv_v2_64 1041 -#define RPC_cublasCtbmv_v2 1042 -#define RPC_cublasCtbmv_v2_64 1043 -#define RPC_cublasZtbmv_v2 1044 -#define RPC_cublasZtbmv_v2_64 1045 -#define RPC_cublasStpmv_v2 1046 -#define RPC_cublasStpmv_v2_64 1047 -#define RPC_cublasDtpmv_v2 1048 -#define RPC_cublasDtpmv_v2_64 1049 -#define RPC_cublasCtpmv_v2 1050 -#define RPC_cublasCtpmv_v2_64 1051 -#define RPC_cublasZtpmv_v2 1052 -#define RPC_cublasZtpmv_v2_64 1053 -#define RPC_cublasStrsv_v2 1054 -#define RPC_cublasStrsv_v2_64 1055 -#define RPC_cublasDtrsv_v2 1056 -#define RPC_cublasDtrsv_v2_64 1057 -#define RPC_cublasCtrsv_v2 1058 -#define RPC_cublasCtrsv_v2_64 1059 -#define RPC_cublasZtrsv_v2 1060 -#define RPC_cublasZtrsv_v2_64 1061 -#define RPC_cublasStpsv_v2 1062 -#define RPC_cublasStpsv_v2_64 1063 -#define RPC_cublasDtpsv_v2 1064 -#define RPC_cublasDtpsv_v2_64 1065 -#define RPC_cublasCtpsv_v2 1066 -#define RPC_cublasCtpsv_v2_64 1067 -#define RPC_cublasZtpsv_v2 1068 -#define RPC_cublasZtpsv_v2_64 1069 -#define RPC_cublasStbsv_v2 1070 -#define RPC_cublasStbsv_v2_64 1071 -#define RPC_cublasDtbsv_v2 1072 -#define RPC_cublasDtbsv_v2_64 1073 -#define RPC_cublasCtbsv_v2 1074 -#define RPC_cublasCtbsv_v2_64 1075 -#define RPC_cublasZtbsv_v2 1076 -#define RPC_cublasZtbsv_v2_64 1077 -#define RPC_cublasSsymv_v2 1078 -#define RPC_cublasSsymv_v2_64 1079 -#define RPC_cublasDsymv_v2 1080 -#define RPC_cublasDsymv_v2_64 1081 -#define RPC_cublasCsymv_v2 1082 -#define RPC_cublasCsymv_v2_64 1083 -#define RPC_cublasZsymv_v2 1084 -#define RPC_cublasZsymv_v2_64 1085 -#define RPC_cublasChemv_v2 1086 -#define RPC_cublasChemv_v2_64 1087 -#define RPC_cublasZhemv_v2 1088 -#define RPC_cublasZhemv_v2_64 1089 -#define RPC_cublasSsbmv_v2 1090 -#define RPC_cublasSsbmv_v2_64 1091 -#define RPC_cublasDsbmv_v2 1092 -#define RPC_cublasDsbmv_v2_64 1093 -#define RPC_cublasChbmv_v2 1094 -#define RPC_cublasChbmv_v2_64 1095 -#define RPC_cublasZhbmv_v2 1096 -#define RPC_cublasZhbmv_v2_64 1097 -#define RPC_cublasSspmv_v2 1098 -#define RPC_cublasSspmv_v2_64 1099 -#define RPC_cublasDspmv_v2 1100 -#define RPC_cublasDspmv_v2_64 1101 -#define RPC_cublasChpmv_v2 1102 -#define RPC_cublasChpmv_v2_64 1103 -#define RPC_cublasZhpmv_v2 1104 -#define RPC_cublasZhpmv_v2_64 1105 -#define RPC_cublasSger_v2 1106 -#define RPC_cublasSger_v2_64 1107 -#define RPC_cublasDger_v2 1108 -#define RPC_cublasDger_v2_64 1109 -#define RPC_cublasCgeru_v2 1110 -#define RPC_cublasCgeru_v2_64 1111 -#define RPC_cublasCgerc_v2 1112 -#define RPC_cublasCgerc_v2_64 1113 -#define RPC_cublasZgeru_v2 1114 -#define RPC_cublasZgeru_v2_64 1115 -#define RPC_cublasZgerc_v2 1116 -#define RPC_cublasZgerc_v2_64 1117 -#define RPC_cublasSsyr_v2 1118 -#define RPC_cublasSsyr_v2_64 1119 -#define RPC_cublasDsyr_v2 1120 -#define RPC_cublasDsyr_v2_64 1121 -#define RPC_cublasCsyr_v2 1122 -#define RPC_cublasCsyr_v2_64 1123 -#define RPC_cublasZsyr_v2 1124 -#define RPC_cublasZsyr_v2_64 1125 -#define RPC_cublasCher_v2 1126 -#define RPC_cublasCher_v2_64 1127 -#define RPC_cublasZher_v2 1128 -#define RPC_cublasZher_v2_64 1129 -#define RPC_cublasSspr_v2 1130 -#define RPC_cublasSspr_v2_64 1131 -#define RPC_cublasDspr_v2 1132 -#define RPC_cublasDspr_v2_64 1133 -#define RPC_cublasChpr_v2 1134 -#define RPC_cublasChpr_v2_64 1135 -#define RPC_cublasZhpr_v2 1136 -#define RPC_cublasZhpr_v2_64 1137 -#define RPC_cublasSsyr2_v2 1138 -#define RPC_cublasSsyr2_v2_64 1139 -#define RPC_cublasDsyr2_v2 1140 -#define RPC_cublasDsyr2_v2_64 1141 -#define RPC_cublasCsyr2_v2 1142 -#define RPC_cublasCsyr2_v2_64 1143 -#define RPC_cublasZsyr2_v2 1144 -#define RPC_cublasZsyr2_v2_64 1145 -#define RPC_cublasCher2_v2 1146 -#define RPC_cublasCher2_v2_64 1147 -#define RPC_cublasZher2_v2 1148 -#define RPC_cublasZher2_v2_64 1149 -#define RPC_cublasSspr2_v2 1150 -#define RPC_cublasSspr2_v2_64 1151 -#define RPC_cublasDspr2_v2 1152 -#define RPC_cublasDspr2_v2_64 1153 -#define RPC_cublasChpr2_v2 1154 -#define RPC_cublasChpr2_v2_64 1155 -#define RPC_cublasZhpr2_v2 1156 -#define RPC_cublasZhpr2_v2_64 1157 -#define RPC_cublasSgemvBatched 1158 -#define RPC_cublasTSTgemvBatched 1159 -#define RPC_cublasSgemvStridedBatched 1160 -#define RPC_cublasSgemvStridedBatched_64 1161 -#define RPC_cublasDgemvStridedBatched 1162 -#define RPC_cublasDgemvStridedBatched_64 1163 -#define RPC_cublasCgemvStridedBatched 1164 -#define RPC_cublasCgemvStridedBatched_64 1165 -#define RPC_cublasZgemvStridedBatched 1166 -#define RPC_cublasZgemvStridedBatched_64 1167 -#define RPC_cublasHSHgemvStridedBatched 1168 -#define RPC_cublasHSHgemvStridedBatched_64 1169 -#define RPC_cublasHSSgemvStridedBatched 1170 -#define RPC_cublasHSSgemvStridedBatched_64 1171 -#define RPC_cublasTSTgemvStridedBatched 1172 -#define RPC_cublasTSTgemvStridedBatched_64 1173 -#define RPC_cublasTSSgemvStridedBatched 1174 -#define RPC_cublasTSSgemvStridedBatched_64 1175 -#define RPC_cublasSgemm_v2 1176 -#define RPC_cublasSgemm_v2_64 1177 -#define RPC_cublasDgemm_v2 1178 -#define RPC_cublasDgemm_v2_64 1179 -#define RPC_cublasCgemm_v2 1180 -#define RPC_cublasCgemm_v2_64 1181 -#define RPC_cublasCgemm3m 1182 -#define RPC_cublasCgemm3m_64 1183 -#define RPC_cublasZgemm_v2 1184 -#define RPC_cublasZgemm_v2_64 1185 -#define RPC_cublasZgemm3m 1186 -#define RPC_cublasZgemm3m_64 1187 -#define RPC_cublasHgemm 1188 -#define RPC_cublasHgemm_64 1189 -#define RPC_cublasSsyrk_v2 1190 -#define RPC_cublasSsyrk_v2_64 1191 -#define RPC_cublasDsyrk_v2 1192 -#define RPC_cublasDsyrk_v2_64 1193 -#define RPC_cublasCsyrk_v2 1194 -#define RPC_cublasCsyrk_v2_64 1195 -#define RPC_cublasZsyrk_v2 1196 -#define RPC_cublasZsyrk_v2_64 1197 -#define RPC_cublasCherk_v2 1198 -#define RPC_cublasCherk_v2_64 1199 -#define RPC_cublasZherk_v2 1200 -#define RPC_cublasZherk_v2_64 1201 -#define RPC_cublasSsyr2k_v2 1202 -#define RPC_cublasSsyr2k_v2_64 1203 -#define RPC_cublasDsyr2k_v2 1204 -#define RPC_cublasDsyr2k_v2_64 1205 -#define RPC_cublasCsyr2k_v2 1206 -#define RPC_cublasCsyr2k_v2_64 1207 -#define RPC_cublasZsyr2k_v2 1208 -#define RPC_cublasZsyr2k_v2_64 1209 -#define RPC_cublasCher2k_v2 1210 -#define RPC_cublasCher2k_v2_64 1211 -#define RPC_cublasZher2k_v2 1212 -#define RPC_cublasZher2k_v2_64 1213 -#define RPC_cublasSsyrkx 1214 -#define RPC_cublasSsyrkx_64 1215 -#define RPC_cublasDsyrkx 1216 -#define RPC_cublasDsyrkx_64 1217 -#define RPC_cublasCsyrkx 1218 -#define RPC_cublasCsyrkx_64 1219 -#define RPC_cublasZsyrkx 1220 -#define RPC_cublasZsyrkx_64 1221 -#define RPC_cublasCherkx 1222 -#define RPC_cublasCherkx_64 1223 -#define RPC_cublasZherkx 1224 -#define RPC_cublasZherkx_64 1225 -#define RPC_cublasSsymm_v2 1226 -#define RPC_cublasSsymm_v2_64 1227 -#define RPC_cublasDsymm_v2 1228 -#define RPC_cublasDsymm_v2_64 1229 -#define RPC_cublasCsymm_v2 1230 -#define RPC_cublasCsymm_v2_64 1231 -#define RPC_cublasZsymm_v2 1232 -#define RPC_cublasZsymm_v2_64 1233 -#define RPC_cublasChemm_v2 1234 -#define RPC_cublasChemm_v2_64 1235 -#define RPC_cublasZhemm_v2 1236 -#define RPC_cublasZhemm_v2_64 1237 -#define RPC_cublasStrsm_v2 1238 -#define RPC_cublasStrsm_v2_64 1239 -#define RPC_cublasDtrsm_v2 1240 -#define RPC_cublasDtrsm_v2_64 1241 -#define RPC_cublasCtrsm_v2 1242 -#define RPC_cublasCtrsm_v2_64 1243 -#define RPC_cublasZtrsm_v2 1244 -#define RPC_cublasZtrsm_v2_64 1245 -#define RPC_cublasStrmm_v2 1246 -#define RPC_cublasStrmm_v2_64 1247 -#define RPC_cublasDtrmm_v2 1248 -#define RPC_cublasDtrmm_v2_64 1249 -#define RPC_cublasCtrmm_v2 1250 -#define RPC_cublasCtrmm_v2_64 1251 -#define RPC_cublasZtrmm_v2 1252 -#define RPC_cublasZtrmm_v2_64 1253 -#define RPC_cublasHgemmBatched 1254 -#define RPC_cublasHgemmBatched_64 1255 -#define RPC_cublasSgemmBatched 1256 -#define RPC_cublasSgemmBatched_64 1257 -#define RPC_cublasDgemmBatched 1258 -#define RPC_cublasDgemmBatched_64 1259 -#define RPC_cublasCgemmBatched 1260 -#define RPC_cublasCgemmBatched_64 1261 -#define RPC_cublasCgemm3mBatched 1262 -#define RPC_cublasCgemm3mBatched_64 1263 -#define RPC_cublasZgemmBatched 1264 -#define RPC_cublasZgemmBatched_64 1265 -#define RPC_cublasHgemmStridedBatched 1266 -#define RPC_cublasHgemmStridedBatched_64 1267 -#define RPC_cublasSgemmStridedBatched 1268 -#define RPC_cublasSgemmStridedBatched_64 1269 -#define RPC_cublasDgemmStridedBatched 1270 -#define RPC_cublasDgemmStridedBatched_64 1271 -#define RPC_cublasCgemmStridedBatched 1272 -#define RPC_cublasCgemmStridedBatched_64 1273 -#define RPC_cublasCgemm3mStridedBatched 1274 -#define RPC_cublasCgemm3mStridedBatched_64 1275 -#define RPC_cublasZgemmStridedBatched 1276 -#define RPC_cublasZgemmStridedBatched_64 1277 -#define RPC_cublasGemmBatchedEx 1278 -#define RPC_cublasGemmBatchedEx_64 1279 -#define RPC_cublasSgeam 1280 -#define RPC_cublasSgeam_64 1281 -#define RPC_cublasDgeam 1282 -#define RPC_cublasDgeam_64 1283 -#define RPC_cublasCgeam 1284 -#define RPC_cublasCgeam_64 1285 -#define RPC_cublasZgeam 1286 -#define RPC_cublasZgeam_64 1287 -#define RPC_cublasStrsmBatched 1288 -#define RPC_cublasStrsmBatched_64 1289 -#define RPC_cublasDtrsmBatched 1290 -#define RPC_cublasDtrsmBatched_64 1291 -#define RPC_cublasCtrsmBatched 1292 -#define RPC_cublasCtrsmBatched_64 1293 -#define RPC_cublasZtrsmBatched 1294 -#define RPC_cublasZtrsmBatched_64 1295 -#define RPC_cublasSdgmm 1296 -#define RPC_cublasSdgmm_64 1297 -#define RPC_cublasDdgmm 1298 -#define RPC_cublasDdgmm_64 1299 -#define RPC_cublasCdgmm 1300 -#define RPC_cublasCdgmm_64 1301 -#define RPC_cublasZdgmm 1302 -#define RPC_cublasZdgmm_64 1303 -#define RPC_cublasSmatinvBatched 1304 -#define RPC_cublasDmatinvBatched 1305 -#define RPC_cublasCmatinvBatched 1306 -#define RPC_cublasZmatinvBatched 1307 -#define RPC_cublasSgeqrfBatched 1308 -#define RPC_cublasDgeqrfBatched 1309 -#define RPC_cublasCgeqrfBatched 1310 -#define RPC_cublasZgeqrfBatched 1311 -#define RPC_cublasSgelsBatched 1312 -#define RPC_cublasDgelsBatched 1313 -#define RPC_cublasCgelsBatched 1314 -#define RPC_cublasZgelsBatched 1315 -#define RPC_cublasStpttr 1316 -#define RPC_cublasDtpttr 1317 -#define RPC_cublasCtpttr 1318 -#define RPC_cublasZtpttr 1319 -#define RPC_cublasStrttp 1320 -#define RPC_cublasDtrttp 1321 -#define RPC_cublasCtrttp 1322 -#define RPC_cublasZtrttp 1323 -#define RPC_cublasSgetriBatched 1324 -#define RPC_cublasDgetriBatched 1325 -#define RPC_cublasCgetriBatched 1326 -#define RPC_cublasZgetriBatched 1327 -#define RPC_cublasSgetrsBatched 1328 -#define RPC_cublasDgetrsBatched 1329 -#define RPC_cublasCgetrsBatched 1330 -#define RPC_cublasZgetrsBatched 1331 -#define RPC_cublasUint8gemmBias 1332 -#define RPC_cublasMigrateComputeType 1333 -#define RPC_cudnnGetVersion 1334 -#define RPC_cudnnGetMaxDeviceVersion 1335 -#define RPC_cudnnGetCudartVersion 1336 -#define RPC_cudnnGetErrorString 1337 -#define RPC_cudnnGetLastErrorString 1338 -#define RPC_cudnnQueryRuntimeError 1339 -#define RPC_cudnnGetProperty 1340 -#define RPC_cudnnCreate 1341 -#define RPC_cudnnDestroy 1342 -#define RPC_cudnnSetStream 1343 -#define RPC_cudnnGetStream 1344 -#define RPC_cudnnGetCallback 1345 -#define RPC_cudnnGraphVersionCheck 1346 -#define RPC_cudnnBackendCreateDescriptor 1347 -#define RPC_cudnnBackendDestroyDescriptor 1348 -#define RPC_cudnnBackendInitialize 1349 -#define RPC_cudnnBackendFinalize 1350 -#define RPC_cudnnBackendSetAttribute 1351 -#define RPC_cudnnBackendExecute 1352 -#define RPC_cudnnBackendPopulateCudaGraph 1353 -#define RPC_cudnnBackendUpdateCudaGraph 1354 -#define RPC_cudnnCreateTensorDescriptor 1355 -#define RPC_cudnnSetTensor4dDescriptor 1356 -#define RPC_cudnnSetTensor4dDescriptorEx 1357 -#define RPC_cudnnGetTensor4dDescriptor 1358 -#define RPC_cudnnGetTensorSizeInBytes 1359 -#define RPC_cudnnDestroyTensorDescriptor 1360 -#define RPC_cudnnInitTransformDest 1361 -#define RPC_cudnnCreateTensorTransformDescriptor 1362 -#define RPC_cudnnDestroyTensorTransformDescriptor 1363 -#define RPC_cudnnCreateOpTensorDescriptor 1364 -#define RPC_cudnnSetOpTensorDescriptor 1365 -#define RPC_cudnnGetOpTensorDescriptor 1366 -#define RPC_cudnnDestroyOpTensorDescriptor 1367 -#define RPC_cudnnCreateReduceTensorDescriptor 1368 -#define RPC_cudnnSetReduceTensorDescriptor 1369 -#define RPC_cudnnGetReduceTensorDescriptor 1370 -#define RPC_cudnnDestroyReduceTensorDescriptor 1371 -#define RPC_cudnnGetReductionIndicesSize 1372 -#define RPC_cudnnGetReductionWorkspaceSize 1373 -#define RPC_cudnnCreateFilterDescriptor 1374 -#define RPC_cudnnSetFilter4dDescriptor 1375 -#define RPC_cudnnGetFilter4dDescriptor 1376 -#define RPC_cudnnGetFilterSizeInBytes 1377 -#define RPC_cudnnDestroyFilterDescriptor 1378 -#define RPC_cudnnCreatePoolingDescriptor 1379 -#define RPC_cudnnSetPooling2dDescriptor 1380 -#define RPC_cudnnGetPooling2dDescriptor 1381 -#define RPC_cudnnGetPooling2dForwardOutputDim 1382 -#define RPC_cudnnDestroyPoolingDescriptor 1383 -#define RPC_cudnnCreateActivationDescriptor 1384 -#define RPC_cudnnSetActivationDescriptor 1385 -#define RPC_cudnnGetActivationDescriptor 1386 -#define RPC_cudnnSetActivationDescriptorSwishBeta 1387 -#define RPC_cudnnGetActivationDescriptorSwishBeta 1388 -#define RPC_cudnnDestroyActivationDescriptor 1389 -#define RPC_cudnnActivationForward 1390 -#define RPC_cudnnCreateLRNDescriptor 1391 -#define RPC_cudnnSetLRNDescriptor 1392 -#define RPC_cudnnGetLRNDescriptor 1393 -#define RPC_cudnnDestroyLRNDescriptor 1394 -#define RPC_cudnnDeriveBNTensorDescriptor 1395 -#define RPC_cudnnDeriveNormTensorDescriptor 1396 -#define RPC_cudnnCreateSpatialTransformerDescriptor 1397 -#define RPC_cudnnDestroySpatialTransformerDescriptor 1398 -#define RPC_cudnnCreateDropoutDescriptor 1399 -#define RPC_cudnnDestroyDropoutDescriptor 1400 -#define RPC_cudnnDropoutGetStatesSize 1401 -#define RPC_cudnnDropoutGetReserveSpaceSize 1402 -#define RPC_cudnnGetDropoutDescriptor 1403 -#define RPC_cudnnOpsVersionCheck 1404 -#define RPC_cudnnGetBatchNormalizationForwardTrainingExWorkspaceSize 1405 -#define RPC_cudnnGetBatchNormalizationBackwardExWorkspaceSize 1406 -#define RPC_cudnnGetBatchNormalizationTrainingExReserveSpaceSize 1407 -#define RPC_cudnnGetNormalizationForwardTrainingWorkspaceSize 1408 -#define RPC_cudnnGetNormalizationBackwardWorkspaceSize 1409 -#define RPC_cudnnGetNormalizationTrainingReserveSpaceSize 1410 +#define RPC_cudaMemset 770 +#define RPC_cudaMemset2D 771 +#define RPC_cudaMemset3D 772 +#define RPC_cudaMemsetAsync 773 +#define RPC_cudaMemset2DAsync 774 +#define RPC_cudaMemset3DAsync 775 +#define RPC_cudaGetSymbolAddress 776 +#define RPC_cudaGetSymbolSize 777 +#define RPC_cudaMemPrefetchAsync 778 +#define RPC_cudaMemAdvise 779 +#define RPC_cudaMemRangeGetAttributes 780 +#define RPC_cudaMemcpyToArray 781 +#define RPC_cudaMemcpyArrayToArray 782 +#define RPC_cudaMemcpyToArrayAsync 783 +#define RPC_cudaMallocAsync 784 +#define RPC_cudaMemPoolTrimTo 785 +#define RPC_cudaMemPoolSetAccess 786 +#define RPC_cudaMemPoolGetAccess 787 +#define RPC_cudaMemPoolCreate 788 +#define RPC_cudaMemPoolDestroy 789 +#define RPC_cudaMallocFromPoolAsync 790 +#define RPC_cudaMemPoolImportPointer 791 +#define RPC_cudaPointerGetAttributes 792 +#define RPC_cudaDeviceCanAccessPeer 793 +#define RPC_cudaDeviceEnablePeerAccess 794 +#define RPC_cudaDeviceDisablePeerAccess 795 +#define RPC_cudaGraphicsUnregisterResource 796 +#define RPC_cudaGraphicsResourceSetMapFlags 797 +#define RPC_cudaGraphicsMapResources 798 +#define RPC_cudaGraphicsUnmapResources 799 +#define RPC_cudaGraphicsResourceGetMappedPointer 800 +#define RPC_cudaGraphicsSubResourceGetMappedArray 801 +#define RPC_cudaGraphicsResourceGetMappedMipmappedArray 802 +#define RPC_cudaGetChannelDesc 803 +#define RPC_cudaCreateChannelDesc 804 +#define RPC_cudaCreateTextureObject 805 +#define RPC_cudaDestroyTextureObject 806 +#define RPC_cudaGetTextureObjectResourceDesc 807 +#define RPC_cudaGetTextureObjectTextureDesc 808 +#define RPC_cudaGetTextureObjectResourceViewDesc 809 +#define RPC_cudaCreateSurfaceObject 810 +#define RPC_cudaDestroySurfaceObject 811 +#define RPC_cudaGetSurfaceObjectResourceDesc 812 +#define RPC_cudaDriverGetVersion 813 +#define RPC_cudaRuntimeGetVersion 814 +#define RPC_cudaGraphCreate 815 +#define RPC_cudaGraphAddKernelNode 816 +#define RPC_cudaGraphKernelNodeGetParams 817 +#define RPC_cudaGraphKernelNodeSetParams 818 +#define RPC_cudaGraphKernelNodeCopyAttributes 819 +#define RPC_cudaGraphKernelNodeGetAttribute 820 +#define RPC_cudaGraphKernelNodeSetAttribute 821 +#define RPC_cudaGraphAddMemcpyNode 822 +#define RPC_cudaGraphAddMemcpyNodeToSymbol 823 +#define RPC_cudaGraphMemcpyNodeGetParams 824 +#define RPC_cudaGraphMemcpyNodeSetParams 825 +#define RPC_cudaGraphMemcpyNodeSetParamsToSymbol 826 +#define RPC_cudaGraphAddMemsetNode 827 +#define RPC_cudaGraphMemsetNodeGetParams 828 +#define RPC_cudaGraphMemsetNodeSetParams 829 +#define RPC_cudaGraphAddHostNode 830 +#define RPC_cudaGraphHostNodeGetParams 831 +#define RPC_cudaGraphHostNodeSetParams 832 +#define RPC_cudaGraphAddChildGraphNode 833 +#define RPC_cudaGraphChildGraphNodeGetGraph 834 +#define RPC_cudaGraphAddEmptyNode 835 +#define RPC_cudaGraphAddEventRecordNode 836 +#define RPC_cudaGraphEventRecordNodeGetEvent 837 +#define RPC_cudaGraphEventRecordNodeSetEvent 838 +#define RPC_cudaGraphAddEventWaitNode 839 +#define RPC_cudaGraphEventWaitNodeGetEvent 840 +#define RPC_cudaGraphEventWaitNodeSetEvent 841 +#define RPC_cudaGraphAddExternalSemaphoresSignalNode 842 +#define RPC_cudaGraphExternalSemaphoresSignalNodeGetParams 843 +#define RPC_cudaGraphExternalSemaphoresSignalNodeSetParams 844 +#define RPC_cudaGraphAddExternalSemaphoresWaitNode 845 +#define RPC_cudaGraphExternalSemaphoresWaitNodeGetParams 846 +#define RPC_cudaGraphExternalSemaphoresWaitNodeSetParams 847 +#define RPC_cudaGraphAddMemAllocNode 848 +#define RPC_cudaGraphMemAllocNodeGetParams 849 +#define RPC_cudaDeviceGraphMemTrim 850 +#define RPC_cudaGraphClone 851 +#define RPC_cudaGraphNodeFindInClone 852 +#define RPC_cudaGraphNodeGetType 853 +#define RPC_cudaGraphGetNodes 854 +#define RPC_cudaGraphGetRootNodes 855 +#define RPC_cudaGraphGetEdges 856 +#define RPC_cudaGraphNodeGetDependencies 857 +#define RPC_cudaGraphNodeGetDependentNodes 858 +#define RPC_cudaGraphAddDependencies 859 +#define RPC_cudaGraphRemoveDependencies 860 +#define RPC_cudaGraphDestroyNode 861 +#define RPC_cudaGraphInstantiate 862 +#define RPC_cudaGraphInstantiateWithFlags 863 +#define RPC_cudaGraphInstantiateWithParams 864 +#define RPC_cudaGraphExecGetFlags 865 +#define RPC_cudaGraphExecKernelNodeSetParams 866 +#define RPC_cudaGraphExecMemcpyNodeSetParams 867 +#define RPC_cudaGraphExecMemcpyNodeSetParamsToSymbol 868 +#define RPC_cudaGraphExecMemsetNodeSetParams 869 +#define RPC_cudaGraphExecHostNodeSetParams 870 +#define RPC_cudaGraphExecChildGraphNodeSetParams 871 +#define RPC_cudaGraphExecEventRecordNodeSetEvent 872 +#define RPC_cudaGraphExecEventWaitNodeSetEvent 873 +#define RPC_cudaGraphExecExternalSemaphoresSignalNodeSetParams 874 +#define RPC_cudaGraphExecExternalSemaphoresWaitNodeSetParams 875 +#define RPC_cudaGraphNodeSetEnabled 876 +#define RPC_cudaGraphNodeGetEnabled 877 +#define RPC_cudaGraphExecUpdate 878 +#define RPC_cudaGraphUpload 879 +#define RPC_cudaGraphLaunch 880 +#define RPC_cudaGraphExecDestroy 881 +#define RPC_cudaGraphDestroy 882 +#define RPC_cudaGraphDebugDotPrint 883 +#define RPC_cudaUserObjectRetain 884 +#define RPC_cudaUserObjectRelease 885 +#define RPC_cudaGraphRetainUserObject 886 +#define RPC_cudaGraphReleaseUserObject 887 +#define RPC_cudaGetDriverEntryPoint 888 +#define RPC_cudaGetExportTable 889 +#define RPC_cudaGetFuncBySymbol 890 +#define RPC_cublasCreate_v2 891 +#define RPC_cublasDestroy_v2 892 +#define RPC_cublasGetVersion_v2 893 +#define RPC_cublasGetProperty 894 +#define RPC_cublasGetCudartVersion 895 +#define RPC_cublasSetStream_v2 896 +#define RPC_cublasGetStream_v2 897 +#define RPC_cublasGetPointerMode_v2 898 +#define RPC_cublasSetPointerMode_v2 899 +#define RPC_cublasGetAtomicsMode 900 +#define RPC_cublasSetAtomicsMode 901 +#define RPC_cublasGetMathMode 902 +#define RPC_cublasSetMathMode 903 +#define RPC_cublasGetSmCountTarget 904 +#define RPC_cublasSetSmCountTarget 905 +#define RPC_cublasGetStatusName 906 +#define RPC_cublasGetStatusString 907 +#define RPC_cublasLoggerConfigure 908 +#define RPC_cublasSetLoggerCallback 909 +#define RPC_cublasGetLoggerCallback 910 +#define RPC_cublasXerbla 911 +#define RPC_cublasSnrm2_v2 912 +#define RPC_cublasSnrm2_v2_64 913 +#define RPC_cublasDnrm2_v2 914 +#define RPC_cublasDnrm2_v2_64 915 +#define RPC_cublasScnrm2_v2 916 +#define RPC_cublasScnrm2_v2_64 917 +#define RPC_cublasDznrm2_v2 918 +#define RPC_cublasDznrm2_v2_64 919 +#define RPC_cublasSdot_v2 920 +#define RPC_cublasSdot_v2_64 921 +#define RPC_cublasDdot_v2 922 +#define RPC_cublasDdot_v2_64 923 +#define RPC_cublasCdotu_v2 924 +#define RPC_cublasCdotu_v2_64 925 +#define RPC_cublasCdotc_v2 926 +#define RPC_cublasCdotc_v2_64 927 +#define RPC_cublasZdotu_v2 928 +#define RPC_cublasZdotu_v2_64 929 +#define RPC_cublasZdotc_v2 930 +#define RPC_cublasZdotc_v2_64 931 +#define RPC_cublasSscal_v2 932 +#define RPC_cublasSscal_v2_64 933 +#define RPC_cublasDscal_v2 934 +#define RPC_cublasDscal_v2_64 935 +#define RPC_cublasCscal_v2 936 +#define RPC_cublasCscal_v2_64 937 +#define RPC_cublasCsscal_v2 938 +#define RPC_cublasCsscal_v2_64 939 +#define RPC_cublasZscal_v2 940 +#define RPC_cublasZscal_v2_64 941 +#define RPC_cublasZdscal_v2 942 +#define RPC_cublasZdscal_v2_64 943 +#define RPC_cublasSaxpy_v2 944 +#define RPC_cublasSaxpy_v2_64 945 +#define RPC_cublasDaxpy_v2 946 +#define RPC_cublasDaxpy_v2_64 947 +#define RPC_cublasCaxpy_v2 948 +#define RPC_cublasCaxpy_v2_64 949 +#define RPC_cublasZaxpy_v2 950 +#define RPC_cublasZaxpy_v2_64 951 +#define RPC_cublasScopy_v2 952 +#define RPC_cublasScopy_v2_64 953 +#define RPC_cublasDcopy_v2 954 +#define RPC_cublasDcopy_v2_64 955 +#define RPC_cublasCcopy_v2 956 +#define RPC_cublasCcopy_v2_64 957 +#define RPC_cublasZcopy_v2 958 +#define RPC_cublasZcopy_v2_64 959 +#define RPC_cublasSswap_v2 960 +#define RPC_cublasSswap_v2_64 961 +#define RPC_cublasDswap_v2 962 +#define RPC_cublasDswap_v2_64 963 +#define RPC_cublasCswap_v2 964 +#define RPC_cublasCswap_v2_64 965 +#define RPC_cublasZswap_v2 966 +#define RPC_cublasZswap_v2_64 967 +#define RPC_cublasIsamax_v2 968 +#define RPC_cublasIsamax_v2_64 969 +#define RPC_cublasIdamax_v2 970 +#define RPC_cublasIdamax_v2_64 971 +#define RPC_cublasIcamax_v2 972 +#define RPC_cublasIcamax_v2_64 973 +#define RPC_cublasIzamax_v2 974 +#define RPC_cublasIzamax_v2_64 975 +#define RPC_cublasIamaxEx 976 +#define RPC_cublasIamaxEx_64 977 +#define RPC_cublasIsamin_v2 978 +#define RPC_cublasIsamin_v2_64 979 +#define RPC_cublasIdamin_v2 980 +#define RPC_cublasIdamin_v2_64 981 +#define RPC_cublasIcamin_v2 982 +#define RPC_cublasIcamin_v2_64 983 +#define RPC_cublasIzamin_v2 984 +#define RPC_cublasIzamin_v2_64 985 +#define RPC_cublasIaminEx 986 +#define RPC_cublasIaminEx_64 987 +#define RPC_cublasSasum_v2 988 +#define RPC_cublasSasum_v2_64 989 +#define RPC_cublasDasum_v2 990 +#define RPC_cublasDasum_v2_64 991 +#define RPC_cublasScasum_v2 992 +#define RPC_cublasScasum_v2_64 993 +#define RPC_cublasDzasum_v2 994 +#define RPC_cublasDzasum_v2_64 995 +#define RPC_cublasSrot_v2 996 +#define RPC_cublasSrot_v2_64 997 +#define RPC_cublasDrot_v2 998 +#define RPC_cublasDrot_v2_64 999 +#define RPC_cublasCrot_v2 1000 +#define RPC_cublasCrot_v2_64 1001 +#define RPC_cublasCsrot_v2 1002 +#define RPC_cublasCsrot_v2_64 1003 +#define RPC_cublasZrot_v2 1004 +#define RPC_cublasZrot_v2_64 1005 +#define RPC_cublasZdrot_v2 1006 +#define RPC_cublasZdrot_v2_64 1007 +#define RPC_cublasSrotg_v2 1008 +#define RPC_cublasDrotg_v2 1009 +#define RPC_cublasCrotg_v2 1010 +#define RPC_cublasZrotg_v2 1011 +#define RPC_cublasSrotm_v2 1012 +#define RPC_cublasSrotm_v2_64 1013 +#define RPC_cublasDrotm_v2 1014 +#define RPC_cublasDrotm_v2_64 1015 +#define RPC_cublasSrotmg_v2 1016 +#define RPC_cublasDrotmg_v2 1017 +#define RPC_cublasSgemv_v2 1018 +#define RPC_cublasSgemv_v2_64 1019 +#define RPC_cublasDgemv_v2 1020 +#define RPC_cublasDgemv_v2_64 1021 +#define RPC_cublasCgemv_v2 1022 +#define RPC_cublasCgemv_v2_64 1023 +#define RPC_cublasZgemv_v2 1024 +#define RPC_cublasZgemv_v2_64 1025 +#define RPC_cublasSgbmv_v2 1026 +#define RPC_cublasSgbmv_v2_64 1027 +#define RPC_cublasDgbmv_v2 1028 +#define RPC_cublasDgbmv_v2_64 1029 +#define RPC_cublasCgbmv_v2 1030 +#define RPC_cublasCgbmv_v2_64 1031 +#define RPC_cublasZgbmv_v2 1032 +#define RPC_cublasZgbmv_v2_64 1033 +#define RPC_cublasStrmv_v2 1034 +#define RPC_cublasStrmv_v2_64 1035 +#define RPC_cublasDtrmv_v2 1036 +#define RPC_cublasDtrmv_v2_64 1037 +#define RPC_cublasCtrmv_v2 1038 +#define RPC_cublasCtrmv_v2_64 1039 +#define RPC_cublasZtrmv_v2 1040 +#define RPC_cublasZtrmv_v2_64 1041 +#define RPC_cublasStbmv_v2 1042 +#define RPC_cublasStbmv_v2_64 1043 +#define RPC_cublasDtbmv_v2 1044 +#define RPC_cublasDtbmv_v2_64 1045 +#define RPC_cublasCtbmv_v2 1046 +#define RPC_cublasCtbmv_v2_64 1047 +#define RPC_cublasZtbmv_v2 1048 +#define RPC_cublasZtbmv_v2_64 1049 +#define RPC_cublasStpmv_v2 1050 +#define RPC_cublasStpmv_v2_64 1051 +#define RPC_cublasDtpmv_v2 1052 +#define RPC_cublasDtpmv_v2_64 1053 +#define RPC_cublasCtpmv_v2 1054 +#define RPC_cublasCtpmv_v2_64 1055 +#define RPC_cublasZtpmv_v2 1056 +#define RPC_cublasZtpmv_v2_64 1057 +#define RPC_cublasStrsv_v2 1058 +#define RPC_cublasStrsv_v2_64 1059 +#define RPC_cublasDtrsv_v2 1060 +#define RPC_cublasDtrsv_v2_64 1061 +#define RPC_cublasCtrsv_v2 1062 +#define RPC_cublasCtrsv_v2_64 1063 +#define RPC_cublasZtrsv_v2 1064 +#define RPC_cublasZtrsv_v2_64 1065 +#define RPC_cublasStpsv_v2 1066 +#define RPC_cublasStpsv_v2_64 1067 +#define RPC_cublasDtpsv_v2 1068 +#define RPC_cublasDtpsv_v2_64 1069 +#define RPC_cublasCtpsv_v2 1070 +#define RPC_cublasCtpsv_v2_64 1071 +#define RPC_cublasZtpsv_v2 1072 +#define RPC_cublasZtpsv_v2_64 1073 +#define RPC_cublasStbsv_v2 1074 +#define RPC_cublasStbsv_v2_64 1075 +#define RPC_cublasDtbsv_v2 1076 +#define RPC_cublasDtbsv_v2_64 1077 +#define RPC_cublasCtbsv_v2 1078 +#define RPC_cublasCtbsv_v2_64 1079 +#define RPC_cublasZtbsv_v2 1080 +#define RPC_cublasZtbsv_v2_64 1081 +#define RPC_cublasSsymv_v2 1082 +#define RPC_cublasSsymv_v2_64 1083 +#define RPC_cublasDsymv_v2 1084 +#define RPC_cublasDsymv_v2_64 1085 +#define RPC_cublasCsymv_v2 1086 +#define RPC_cublasCsymv_v2_64 1087 +#define RPC_cublasZsymv_v2 1088 +#define RPC_cublasZsymv_v2_64 1089 +#define RPC_cublasChemv_v2 1090 +#define RPC_cublasChemv_v2_64 1091 +#define RPC_cublasZhemv_v2 1092 +#define RPC_cublasZhemv_v2_64 1093 +#define RPC_cublasSsbmv_v2 1094 +#define RPC_cublasSsbmv_v2_64 1095 +#define RPC_cublasDsbmv_v2 1096 +#define RPC_cublasDsbmv_v2_64 1097 +#define RPC_cublasChbmv_v2 1098 +#define RPC_cublasChbmv_v2_64 1099 +#define RPC_cublasZhbmv_v2 1100 +#define RPC_cublasZhbmv_v2_64 1101 +#define RPC_cublasSspmv_v2 1102 +#define RPC_cublasSspmv_v2_64 1103 +#define RPC_cublasDspmv_v2 1104 +#define RPC_cublasDspmv_v2_64 1105 +#define RPC_cublasChpmv_v2 1106 +#define RPC_cublasChpmv_v2_64 1107 +#define RPC_cublasZhpmv_v2 1108 +#define RPC_cublasZhpmv_v2_64 1109 +#define RPC_cublasSger_v2 1110 +#define RPC_cublasSger_v2_64 1111 +#define RPC_cublasDger_v2 1112 +#define RPC_cublasDger_v2_64 1113 +#define RPC_cublasCgeru_v2 1114 +#define RPC_cublasCgeru_v2_64 1115 +#define RPC_cublasCgerc_v2 1116 +#define RPC_cublasCgerc_v2_64 1117 +#define RPC_cublasZgeru_v2 1118 +#define RPC_cublasZgeru_v2_64 1119 +#define RPC_cublasZgerc_v2 1120 +#define RPC_cublasZgerc_v2_64 1121 +#define RPC_cublasSsyr_v2 1122 +#define RPC_cublasSsyr_v2_64 1123 +#define RPC_cublasDsyr_v2 1124 +#define RPC_cublasDsyr_v2_64 1125 +#define RPC_cublasCsyr_v2 1126 +#define RPC_cublasCsyr_v2_64 1127 +#define RPC_cublasZsyr_v2 1128 +#define RPC_cublasZsyr_v2_64 1129 +#define RPC_cublasCher_v2 1130 +#define RPC_cublasCher_v2_64 1131 +#define RPC_cublasZher_v2 1132 +#define RPC_cublasZher_v2_64 1133 +#define RPC_cublasSspr_v2 1134 +#define RPC_cublasSspr_v2_64 1135 +#define RPC_cublasDspr_v2 1136 +#define RPC_cublasDspr_v2_64 1137 +#define RPC_cublasChpr_v2 1138 +#define RPC_cublasChpr_v2_64 1139 +#define RPC_cublasZhpr_v2 1140 +#define RPC_cublasZhpr_v2_64 1141 +#define RPC_cublasSsyr2_v2 1142 +#define RPC_cublasSsyr2_v2_64 1143 +#define RPC_cublasDsyr2_v2 1144 +#define RPC_cublasDsyr2_v2_64 1145 +#define RPC_cublasCsyr2_v2 1146 +#define RPC_cublasCsyr2_v2_64 1147 +#define RPC_cublasZsyr2_v2 1148 +#define RPC_cublasZsyr2_v2_64 1149 +#define RPC_cublasCher2_v2 1150 +#define RPC_cublasCher2_v2_64 1151 +#define RPC_cublasZher2_v2 1152 +#define RPC_cublasZher2_v2_64 1153 +#define RPC_cublasSspr2_v2 1154 +#define RPC_cublasSspr2_v2_64 1155 +#define RPC_cublasDspr2_v2 1156 +#define RPC_cublasDspr2_v2_64 1157 +#define RPC_cublasChpr2_v2 1158 +#define RPC_cublasChpr2_v2_64 1159 +#define RPC_cublasZhpr2_v2 1160 +#define RPC_cublasZhpr2_v2_64 1161 +#define RPC_cublasSgemvBatched 1162 +#define RPC_cublasTSTgemvBatched 1163 +#define RPC_cublasSgemvStridedBatched 1164 +#define RPC_cublasSgemvStridedBatched_64 1165 +#define RPC_cublasDgemvStridedBatched 1166 +#define RPC_cublasDgemvStridedBatched_64 1167 +#define RPC_cublasCgemvStridedBatched 1168 +#define RPC_cublasCgemvStridedBatched_64 1169 +#define RPC_cublasZgemvStridedBatched 1170 +#define RPC_cublasZgemvStridedBatched_64 1171 +#define RPC_cublasHSHgemvStridedBatched 1172 +#define RPC_cublasHSHgemvStridedBatched_64 1173 +#define RPC_cublasHSSgemvStridedBatched 1174 +#define RPC_cublasHSSgemvStridedBatched_64 1175 +#define RPC_cublasTSTgemvStridedBatched 1176 +#define RPC_cublasTSTgemvStridedBatched_64 1177 +#define RPC_cublasTSSgemvStridedBatched 1178 +#define RPC_cublasTSSgemvStridedBatched_64 1179 +#define RPC_cublasSgemm_v2 1180 +#define RPC_cublasSgemm_v2_64 1181 +#define RPC_cublasDgemm_v2 1182 +#define RPC_cublasDgemm_v2_64 1183 +#define RPC_cublasCgemm_v2 1184 +#define RPC_cublasCgemm_v2_64 1185 +#define RPC_cublasCgemm3m 1186 +#define RPC_cublasCgemm3m_64 1187 +#define RPC_cublasZgemm_v2 1188 +#define RPC_cublasZgemm_v2_64 1189 +#define RPC_cublasZgemm3m 1190 +#define RPC_cublasZgemm3m_64 1191 +#define RPC_cublasHgemm 1192 +#define RPC_cublasHgemm_64 1193 +#define RPC_cublasSsyrk_v2 1194 +#define RPC_cublasSsyrk_v2_64 1195 +#define RPC_cublasDsyrk_v2 1196 +#define RPC_cublasDsyrk_v2_64 1197 +#define RPC_cublasCsyrk_v2 1198 +#define RPC_cublasCsyrk_v2_64 1199 +#define RPC_cublasZsyrk_v2 1200 +#define RPC_cublasZsyrk_v2_64 1201 +#define RPC_cublasCherk_v2 1202 +#define RPC_cublasCherk_v2_64 1203 +#define RPC_cublasZherk_v2 1204 +#define RPC_cublasZherk_v2_64 1205 +#define RPC_cublasSsyr2k_v2 1206 +#define RPC_cublasSsyr2k_v2_64 1207 +#define RPC_cublasDsyr2k_v2 1208 +#define RPC_cublasDsyr2k_v2_64 1209 +#define RPC_cublasCsyr2k_v2 1210 +#define RPC_cublasCsyr2k_v2_64 1211 +#define RPC_cublasZsyr2k_v2 1212 +#define RPC_cublasZsyr2k_v2_64 1213 +#define RPC_cublasCher2k_v2 1214 +#define RPC_cublasCher2k_v2_64 1215 +#define RPC_cublasZher2k_v2 1216 +#define RPC_cublasZher2k_v2_64 1217 +#define RPC_cublasSsyrkx 1218 +#define RPC_cublasSsyrkx_64 1219 +#define RPC_cublasDsyrkx 1220 +#define RPC_cublasDsyrkx_64 1221 +#define RPC_cublasCsyrkx 1222 +#define RPC_cublasCsyrkx_64 1223 +#define RPC_cublasZsyrkx 1224 +#define RPC_cublasZsyrkx_64 1225 +#define RPC_cublasCherkx 1226 +#define RPC_cublasCherkx_64 1227 +#define RPC_cublasZherkx 1228 +#define RPC_cublasZherkx_64 1229 +#define RPC_cublasSsymm_v2 1230 +#define RPC_cublasSsymm_v2_64 1231 +#define RPC_cublasDsymm_v2 1232 +#define RPC_cublasDsymm_v2_64 1233 +#define RPC_cublasCsymm_v2 1234 +#define RPC_cublasCsymm_v2_64 1235 +#define RPC_cublasZsymm_v2 1236 +#define RPC_cublasZsymm_v2_64 1237 +#define RPC_cublasChemm_v2 1238 +#define RPC_cublasChemm_v2_64 1239 +#define RPC_cublasZhemm_v2 1240 +#define RPC_cublasZhemm_v2_64 1241 +#define RPC_cublasStrsm_v2 1242 +#define RPC_cublasStrsm_v2_64 1243 +#define RPC_cublasDtrsm_v2 1244 +#define RPC_cublasDtrsm_v2_64 1245 +#define RPC_cublasCtrsm_v2 1246 +#define RPC_cublasCtrsm_v2_64 1247 +#define RPC_cublasZtrsm_v2 1248 +#define RPC_cublasZtrsm_v2_64 1249 +#define RPC_cublasStrmm_v2 1250 +#define RPC_cublasStrmm_v2_64 1251 +#define RPC_cublasDtrmm_v2 1252 +#define RPC_cublasDtrmm_v2_64 1253 +#define RPC_cublasCtrmm_v2 1254 +#define RPC_cublasCtrmm_v2_64 1255 +#define RPC_cublasZtrmm_v2 1256 +#define RPC_cublasZtrmm_v2_64 1257 +#define RPC_cublasHgemmBatched 1258 +#define RPC_cublasHgemmBatched_64 1259 +#define RPC_cublasSgemmBatched 1260 +#define RPC_cublasSgemmBatched_64 1261 +#define RPC_cublasDgemmBatched 1262 +#define RPC_cublasDgemmBatched_64 1263 +#define RPC_cublasCgemmBatched 1264 +#define RPC_cublasCgemmBatched_64 1265 +#define RPC_cublasCgemm3mBatched 1266 +#define RPC_cublasCgemm3mBatched_64 1267 +#define RPC_cublasZgemmBatched 1268 +#define RPC_cublasZgemmBatched_64 1269 +#define RPC_cublasHgemmStridedBatched 1270 +#define RPC_cublasHgemmStridedBatched_64 1271 +#define RPC_cublasSgemmStridedBatched 1272 +#define RPC_cublasSgemmStridedBatched_64 1273 +#define RPC_cublasDgemmStridedBatched 1274 +#define RPC_cublasDgemmStridedBatched_64 1275 +#define RPC_cublasCgemmStridedBatched 1276 +#define RPC_cublasCgemmStridedBatched_64 1277 +#define RPC_cublasCgemm3mStridedBatched 1278 +#define RPC_cublasCgemm3mStridedBatched_64 1279 +#define RPC_cublasZgemmStridedBatched 1280 +#define RPC_cublasZgemmStridedBatched_64 1281 +#define RPC_cublasGemmBatchedEx 1282 +#define RPC_cublasGemmBatchedEx_64 1283 +#define RPC_cublasSgeam 1284 +#define RPC_cublasSgeam_64 1285 +#define RPC_cublasDgeam 1286 +#define RPC_cublasDgeam_64 1287 +#define RPC_cublasCgeam 1288 +#define RPC_cublasCgeam_64 1289 +#define RPC_cublasZgeam 1290 +#define RPC_cublasZgeam_64 1291 +#define RPC_cublasStrsmBatched 1292 +#define RPC_cublasStrsmBatched_64 1293 +#define RPC_cublasDtrsmBatched 1294 +#define RPC_cublasDtrsmBatched_64 1295 +#define RPC_cublasCtrsmBatched 1296 +#define RPC_cublasCtrsmBatched_64 1297 +#define RPC_cublasZtrsmBatched 1298 +#define RPC_cublasZtrsmBatched_64 1299 +#define RPC_cublasSdgmm 1300 +#define RPC_cublasSdgmm_64 1301 +#define RPC_cublasDdgmm 1302 +#define RPC_cublasDdgmm_64 1303 +#define RPC_cublasCdgmm 1304 +#define RPC_cublasCdgmm_64 1305 +#define RPC_cublasZdgmm 1306 +#define RPC_cublasZdgmm_64 1307 +#define RPC_cublasSmatinvBatched 1308 +#define RPC_cublasDmatinvBatched 1309 +#define RPC_cublasCmatinvBatched 1310 +#define RPC_cublasZmatinvBatched 1311 +#define RPC_cublasSgeqrfBatched 1312 +#define RPC_cublasDgeqrfBatched 1313 +#define RPC_cublasCgeqrfBatched 1314 +#define RPC_cublasZgeqrfBatched 1315 +#define RPC_cublasSgelsBatched 1316 +#define RPC_cublasDgelsBatched 1317 +#define RPC_cublasCgelsBatched 1318 +#define RPC_cublasZgelsBatched 1319 +#define RPC_cublasStpttr 1320 +#define RPC_cublasDtpttr 1321 +#define RPC_cublasCtpttr 1322 +#define RPC_cublasZtpttr 1323 +#define RPC_cublasStrttp 1324 +#define RPC_cublasDtrttp 1325 +#define RPC_cublasCtrttp 1326 +#define RPC_cublasZtrttp 1327 +#define RPC_cublasSgetriBatched 1328 +#define RPC_cublasDgetriBatched 1329 +#define RPC_cublasCgetriBatched 1330 +#define RPC_cublasZgetriBatched 1331 +#define RPC_cublasSgetrsBatched 1332 +#define RPC_cublasDgetrsBatched 1333 +#define RPC_cublasCgetrsBatched 1334 +#define RPC_cublasZgetrsBatched 1335 +#define RPC_cublasUint8gemmBias 1336 +#define RPC_cublasMigrateComputeType 1337 +#define RPC_cudnnGetVersion 1338 +#define RPC_cudnnGetMaxDeviceVersion 1339 +#define RPC_cudnnGetCudartVersion 1340 +#define RPC_cudnnGetErrorString 1341 +#define RPC_cudnnGetLastErrorString 1342 +#define RPC_cudnnQueryRuntimeError 1343 +#define RPC_cudnnGetProperty 1344 +#define RPC_cudnnCreate 1345 +#define RPC_cudnnDestroy 1346 +#define RPC_cudnnSetStream 1347 +#define RPC_cudnnGetStream 1348 +#define RPC_cudnnGetCallback 1349 +#define RPC_cudnnGraphVersionCheck 1350 +#define RPC_cudnnBackendCreateDescriptor 1351 +#define RPC_cudnnBackendDestroyDescriptor 1352 +#define RPC_cudnnBackendInitialize 1353 +#define RPC_cudnnBackendFinalize 1354 +#define RPC_cudnnBackendSetAttribute 1355 +#define RPC_cudnnBackendExecute 1356 +#define RPC_cudnnBackendPopulateCudaGraph 1357 +#define RPC_cudnnBackendUpdateCudaGraph 1358 +#define RPC_cudnnCreateTensorDescriptor 1359 +#define RPC_cudnnSetTensor4dDescriptor 1360 +#define RPC_cudnnSetTensor4dDescriptorEx 1361 +#define RPC_cudnnGetTensor4dDescriptor 1362 +#define RPC_cudnnGetTensorSizeInBytes 1363 +#define RPC_cudnnDestroyTensorDescriptor 1364 +#define RPC_cudnnInitTransformDest 1365 +#define RPC_cudnnCreateTensorTransformDescriptor 1366 +#define RPC_cudnnDestroyTensorTransformDescriptor 1367 +#define RPC_cudnnCreateOpTensorDescriptor 1368 +#define RPC_cudnnSetOpTensorDescriptor 1369 +#define RPC_cudnnGetOpTensorDescriptor 1370 +#define RPC_cudnnDestroyOpTensorDescriptor 1371 +#define RPC_cudnnCreateReduceTensorDescriptor 1372 +#define RPC_cudnnSetReduceTensorDescriptor 1373 +#define RPC_cudnnGetReduceTensorDescriptor 1374 +#define RPC_cudnnDestroyReduceTensorDescriptor 1375 +#define RPC_cudnnGetReductionIndicesSize 1376 +#define RPC_cudnnGetReductionWorkspaceSize 1377 +#define RPC_cudnnCreateFilterDescriptor 1378 +#define RPC_cudnnSetFilter4dDescriptor 1379 +#define RPC_cudnnGetFilter4dDescriptor 1380 +#define RPC_cudnnGetFilterSizeInBytes 1381 +#define RPC_cudnnDestroyFilterDescriptor 1382 +#define RPC_cudnnCreatePoolingDescriptor 1383 +#define RPC_cudnnSetPooling2dDescriptor 1384 +#define RPC_cudnnGetPooling2dDescriptor 1385 +#define RPC_cudnnGetPooling2dForwardOutputDim 1386 +#define RPC_cudnnDestroyPoolingDescriptor 1387 +#define RPC_cudnnCreateActivationDescriptor 1388 +#define RPC_cudnnSetActivationDescriptor 1389 +#define RPC_cudnnGetActivationDescriptor 1390 +#define RPC_cudnnSetActivationDescriptorSwishBeta 1391 +#define RPC_cudnnGetActivationDescriptorSwishBeta 1392 +#define RPC_cudnnDestroyActivationDescriptor 1393 +#define RPC_cudnnActivationForward 1394 +#define RPC_cudnnCreateLRNDescriptor 1395 +#define RPC_cudnnSetLRNDescriptor 1396 +#define RPC_cudnnGetLRNDescriptor 1397 +#define RPC_cudnnDestroyLRNDescriptor 1398 +#define RPC_cudnnDeriveBNTensorDescriptor 1399 +#define RPC_cudnnDeriveNormTensorDescriptor 1400 +#define RPC_cudnnCreateSpatialTransformerDescriptor 1401 +#define RPC_cudnnDestroySpatialTransformerDescriptor 1402 +#define RPC_cudnnCreateDropoutDescriptor 1403 +#define RPC_cudnnDestroyDropoutDescriptor 1404 +#define RPC_cudnnDropoutGetStatesSize 1405 +#define RPC_cudnnDropoutGetReserveSpaceSize 1406 +#define RPC_cudnnGetDropoutDescriptor 1407 +#define RPC_cudnnOpsVersionCheck 1408 +#define RPC_cudnnGetBatchNormalizationForwardTrainingExWorkspaceSize 1409 +#define RPC_cudnnGetBatchNormalizationBackwardExWorkspaceSize 1410 +#define RPC_cudnnGetBatchNormalizationTrainingExReserveSpaceSize 1411 +#define RPC_cudnnGetNormalizationForwardTrainingWorkspaceSize 1412 +#define RPC_cudnnGetNormalizationBackwardWorkspaceSize 1413 +#define RPC_cudnnGetNormalizationTrainingReserveSpaceSize 1414 diff --git a/codegen/gen_client.cpp b/codegen/gen_client.cpp index b9979f5..825a212 100644 --- a/codegen/gen_client.cpp +++ b/codegen/gen_client.cpp @@ -18518,6 +18518,63 @@ cudaError_t cudaMemcpyToSymbolAsync(const void *symbol, const void *src, return return_value; } +cudaError_t cudaMemset(void *devPtr, int value, size_t count) { + if (maybe_copy_unified_arg(0, (void *)devPtr, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&value, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&count, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + cudaError_t return_value; + if (rpc_start_request(0, RPC_cudaMemset) < 0 || + rpc_write(0, &devPtr, sizeof(void *)) < 0 || + rpc_write(0, &value, sizeof(int)) < 0 || + rpc_write(0, &count, sizeof(size_t)) < 0 || + rpc_wait_for_response(0) < 0 || rpc_end_response(0, &return_value) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)devPtr, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&value, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&count, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + return return_value; +} + +cudaError_t cudaMemset2D(void *devPtr, size_t pitch, int value, size_t width, + size_t height) { + if (maybe_copy_unified_arg(0, (void *)devPtr, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&pitch, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&value, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&width, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&height, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + cudaError_t return_value; + if (rpc_start_request(0, RPC_cudaMemset2D) < 0 || + rpc_write(0, &devPtr, sizeof(void *)) < 0 || + rpc_write(0, &pitch, sizeof(size_t)) < 0 || + rpc_write(0, &value, sizeof(int)) < 0 || + rpc_write(0, &width, sizeof(size_t)) < 0 || + rpc_write(0, &height, sizeof(size_t)) < 0 || + rpc_wait_for_response(0) < 0 || rpc_end_response(0, &return_value) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)devPtr, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&pitch, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&value, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&width, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&height, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + return return_value; +} + cudaError_t cudaMemset3D(struct cudaPitchedPtr pitchedDevPtr, int value, struct cudaExtent extent) { if (maybe_copy_unified_arg(0, (void *)&pitchedDevPtr, @@ -18544,6 +18601,75 @@ cudaError_t cudaMemset3D(struct cudaPitchedPtr pitchedDevPtr, int value, return return_value; } +cudaError_t cudaMemsetAsync(void *devPtr, int value, size_t count, + cudaStream_t stream) { + if (maybe_copy_unified_arg(0, (void *)devPtr, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&value, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&count, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&stream, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + cudaError_t return_value; + if (rpc_start_request(0, RPC_cudaMemsetAsync) < 0 || + rpc_write(0, &devPtr, sizeof(void *)) < 0 || + rpc_write(0, &value, sizeof(int)) < 0 || + rpc_write(0, &count, sizeof(size_t)) < 0 || + rpc_write(0, &stream, sizeof(cudaStream_t)) < 0 || + rpc_wait_for_response(0) < 0 || rpc_end_response(0, &return_value) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)devPtr, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&value, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&count, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&stream, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + return return_value; +} + +cudaError_t cudaMemset2DAsync(void *devPtr, size_t pitch, int value, + size_t width, size_t height, + cudaStream_t stream) { + if (maybe_copy_unified_arg(0, (void *)devPtr, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&pitch, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&value, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&width, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&height, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&stream, cudaMemcpyHostToDevice) < 0) + return cudaErrorDevicesUnavailable; + cudaError_t return_value; + if (rpc_start_request(0, RPC_cudaMemset2DAsync) < 0 || + rpc_write(0, &devPtr, sizeof(void *)) < 0 || + rpc_write(0, &pitch, sizeof(size_t)) < 0 || + rpc_write(0, &value, sizeof(int)) < 0 || + rpc_write(0, &width, sizeof(size_t)) < 0 || + rpc_write(0, &height, sizeof(size_t)) < 0 || + rpc_write(0, &stream, sizeof(cudaStream_t)) < 0 || + rpc_wait_for_response(0) < 0 || rpc_end_response(0, &return_value) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)devPtr, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&pitch, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&value, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&width, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&height, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + if (maybe_copy_unified_arg(0, (void *)&stream, cudaMemcpyDeviceToHost) < 0) + return cudaErrorDevicesUnavailable; + return return_value; +} + cudaError_t cudaMemset3DAsync(struct cudaPitchedPtr pitchedDevPtr, int value, struct cudaExtent extent, cudaStream_t stream) { if (maybe_copy_unified_arg(0, (void *)&pitchedDevPtr, @@ -53323,7 +53449,11 @@ std::unordered_map functionMap = { {"cudaMemcpyToSymbol", (void *)cudaMemcpyToSymbol}, {"cudaMemcpy2DToArrayAsync", (void *)cudaMemcpy2DToArrayAsync}, {"cudaMemcpyToSymbolAsync", (void *)cudaMemcpyToSymbolAsync}, + {"cudaMemset", (void *)cudaMemset}, + {"cudaMemset2D", (void *)cudaMemset2D}, {"cudaMemset3D", (void *)cudaMemset3D}, + {"cudaMemsetAsync", (void *)cudaMemsetAsync}, + {"cudaMemset2DAsync", (void *)cudaMemset2DAsync}, {"cudaMemset3DAsync", (void *)cudaMemset3DAsync}, {"cudaGetSymbolAddress", (void *)cudaGetSymbolAddress}, {"cudaGetSymbolSize", (void *)cudaGetSymbolSize}, diff --git a/codegen/gen_server.cpp b/codegen/gen_server.cpp index d42ef85..f67db52 100644 --- a/codegen/gen_server.cpp +++ b/codegen/gen_server.cpp @@ -18813,6 +18813,60 @@ int handle_cudaMemcpyToSymbolAsync(void *conn) { return -1; } +int handle_cudaMemset(void *conn) { + void *devPtr; + int value; + size_t count; + int request_id; + cudaError_t scuda_intercept_result; + if (rpc_read(conn, &devPtr, sizeof(void *)) < 0 || + rpc_read(conn, &value, sizeof(int)) < 0 || + rpc_read(conn, &count, sizeof(size_t)) < 0 || false) + goto ERROR_0; + + request_id = rpc_end_request(conn); + if (request_id < 0) + goto ERROR_0; + scuda_intercept_result = cudaMemset(devPtr, value, count); + + if (rpc_start_response(conn, request_id) < 0 || + rpc_end_response(conn, &scuda_intercept_result) < 0) + goto ERROR_0; + + return 0; +ERROR_0: + return -1; +} + +int handle_cudaMemset2D(void *conn) { + void *devPtr; + size_t pitch; + int value; + size_t width; + size_t height; + int request_id; + cudaError_t scuda_intercept_result; + if (rpc_read(conn, &devPtr, sizeof(void *)) < 0 || + rpc_read(conn, &pitch, sizeof(size_t)) < 0 || + rpc_read(conn, &value, sizeof(int)) < 0 || + rpc_read(conn, &width, sizeof(size_t)) < 0 || + rpc_read(conn, &height, sizeof(size_t)) < 0 || false) + goto ERROR_0; + + request_id = rpc_end_request(conn); + if (request_id < 0) + goto ERROR_0; + scuda_intercept_result = cudaMemset2D(devPtr, pitch, value, width, height); + + if (rpc_start_response(conn, request_id) < 0 || + rpc_end_response(conn, &scuda_intercept_result) < 0) + goto ERROR_0; + + return 0; +ERROR_0: + return -1; +} + int handle_cudaMemset3D(void *conn) { struct cudaPitchedPtr pitchedDevPtr; int value; @@ -18838,6 +18892,65 @@ int handle_cudaMemset3D(void *conn) { return -1; } +int handle_cudaMemsetAsync(void *conn) { + void *devPtr; + int value; + size_t count; + cudaStream_t stream; + int request_id; + cudaError_t scuda_intercept_result; + if (rpc_read(conn, &devPtr, sizeof(void *)) < 0 || + rpc_read(conn, &value, sizeof(int)) < 0 || + rpc_read(conn, &count, sizeof(size_t)) < 0 || + rpc_read(conn, &stream, sizeof(cudaStream_t)) < 0 || false) + goto ERROR_0; + + request_id = rpc_end_request(conn); + if (request_id < 0) + goto ERROR_0; + scuda_intercept_result = cudaMemsetAsync(devPtr, value, count, stream); + + if (rpc_start_response(conn, request_id) < 0 || + rpc_end_response(conn, &scuda_intercept_result) < 0) + goto ERROR_0; + + return 0; +ERROR_0: + return -1; +} + +int handle_cudaMemset2DAsync(void *conn) { + void *devPtr; + size_t pitch; + int value; + size_t width; + size_t height; + cudaStream_t stream; + int request_id; + cudaError_t scuda_intercept_result; + if (rpc_read(conn, &devPtr, sizeof(void *)) < 0 || + rpc_read(conn, &pitch, sizeof(size_t)) < 0 || + rpc_read(conn, &value, sizeof(int)) < 0 || + rpc_read(conn, &width, sizeof(size_t)) < 0 || + rpc_read(conn, &height, sizeof(size_t)) < 0 || + rpc_read(conn, &stream, sizeof(cudaStream_t)) < 0 || false) + goto ERROR_0; + + request_id = rpc_end_request(conn); + if (request_id < 0) + goto ERROR_0; + scuda_intercept_result = + cudaMemset2DAsync(devPtr, pitch, value, width, height, stream); + + if (rpc_start_response(conn, request_id) < 0 || + rpc_end_response(conn, &scuda_intercept_result) < 0) + goto ERROR_0; + + return 0; +ERROR_0: + return -1; +} + int handle_cudaMemset3DAsync(void *conn) { struct cudaPitchedPtr pitchedDevPtr; int value; @@ -42837,7 +42950,11 @@ static RequestHandler opHandlers[] = { handle_cudaMemcpyAsync, handle_cudaMemcpy2DToArrayAsync, handle_cudaMemcpyToSymbolAsync, + handle_cudaMemset, + handle_cudaMemset2D, handle_cudaMemset3D, + handle_cudaMemsetAsync, + handle_cudaMemset2DAsync, handle_cudaMemset3DAsync, handle_cudaGetSymbolAddress, handle_cudaGetSymbolSize,