Created
June 19, 2025 00:43
-
-
Save shunting314/ae6594e234a5d35943873a0bd7e58278 to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
dev,name,batch_size,speedup,abs_latency,compilation_latency,compression_ratio,eager_peak_mem,dynamo_peak_mem,calls_captured,unique_graphs,graph_breaks,unique_graph_breaks,autograd_captures,autograd_compiles,cudagraph_skips | |
cuda,AlbertForQuestionAnswering,4,1.852471,56.497508,24.829062,1.739568,13.134039,7.550172,551,2,6,5,0,0,0 | |
cuda,AlbertForQuestionAnswering,4,1.798106,58.392157,25.367629,1.636454,13.134039,8.025914,551,2,6,5,0,0,0 | |
cuda,AlbertForQuestionAnswering,4,1.853116,56.697391,24.828594,1.739568,13.134039,7.550172,551,2,6,5,0,0,0 | |
cuda,AlbertForQuestionAnswering,4,1.794527,58.544738,25.522933,1.636454,13.134039,8.025914,551,2,6,5,0,0,0 | |
cuda,AlbertForQuestionAnswering,4,1.851322,56.775110,25.294649,1.739568,13.134039,7.550172,551,2,6,5,0,0,0 | |
cuda,AlbertForQuestionAnswering,4,1.797679,58.396403,25.496219,1.636454,13.134039,8.025914,551,2,6,5,0,0,0 | |
cuda,BertForQuestionAnswering,16,1.225475,25.869646,42.943145,1.092308,5.395956,4.939960,1347,2,6,5,0,0,0 | |
cuda,BertForQuestionAnswering,16,1.204907,26.294820,42.214650,1.092221,5.395956,4.940353,1347,2,6,5,0,0,0 | |
cuda,BertForQuestionAnswering,16,1.226961,26.179861,42.043055,1.092482,5.395956,4.939173,1347,2,6,5,0,0,0 | |
cuda,BertForQuestionAnswering,16,1.206214,26.300689,40.537534,1.092221,5.395956,4.940353,1347,2,6,5,0,0,0 | |
cuda,BertForQuestionAnswering,16,1.222706,25.936532,41.258963,1.092482,5.395956,4.939173,1347,2,6,5,0,0,0 | |
cuda,BertForQuestionAnswering,16,1.212368,26.533147,41.623621,1.092221,5.395956,4.940353,1347,2,6,5,0,0,0 | |
cuda,ElectraForQuestionAnswering,64,3.754523,20.174963,46.326723,2.396695,10.570966,4.410643,1453,2,6,5,0,0,0 | |
cuda,ElectraForQuestionAnswering,64,3.748277,20.188388,43.730340,2.396695,10.570966,4.410643,1453,2,6,5,0,0,0 | |
cuda,ElectraForQuestionAnswering,64,3.688690,20.556087,45.990228,2.396695,10.570966,4.410643,1453,2,6,5,0,0,0 | |
cuda,ElectraForQuestionAnswering,64,3.712017,20.423530,44.589959,2.396695,10.570966,4.410643,1453,2,6,5,0,0,0 | |
cuda,ElectraForQuestionAnswering,64,3.741652,20.236816,45.007310,2.396695,10.570966,4.410643,1453,2,6,5,0,0,0 | |
cuda,ElectraForQuestionAnswering,64,3.666431,20.725799,45.476170,2.396695,10.570966,4.410643,1453,2,6,5,0,0,0 | |
cuda,GPT2ForSequenceClassification,4,2.706283,12.750462,56.384880,1.575609,6.002288,3.809503,1962,3,7,5,0,0,0 | |
cuda,GPT2ForSequenceClassification,4,2.594032,13.328177,57.485921,1.575160,6.000059,3.809176,1962,3,7,5,0,0,0 | |
cuda,GPT2ForSequenceClassification,4,2.668007,12.980574,57.427639,1.575729,6.000059,3.807799,1962,3,7,5,0,0,0 | |
cuda,GPT2ForSequenceClassification,4,2.604990,13.250499,55.648442,1.575745,6.002288,3.809176,1962,3,7,5,0,0,0 | |
cuda,GPT2ForSequenceClassification,4,2.706866,12.799780,55.551793,1.576314,6.002288,3.807799,1962,3,7,5,0,0,0 | |
cuda,GPT2ForSequenceClassification,4,2.615950,13.194679,56.253762,1.575160,6.000059,3.809176,1962,3,7,5,0,0,0 | |
cuda,GoogleFnet,16,1.923126,33.220521,25.188736,2.123714,12.856360,6.053715,791,2,6,5,0,0,0 | |
cuda,GoogleFnet,16,1.916119,33.187140,23.662219,2.123300,12.856360,6.054895,791,2,6,5,0,0,0 | |
cuda,GoogleFnet,16,1.924351,33.046211,24.222188,2.123714,12.856360,6.053715,791,2,6,5,0,0,0 | |
cuda,GoogleFnet,16,1.892251,33.791873,25.199200,2.123300,12.856360,6.054895,791,2,6,5,0,0,0 | |
cuda,GoogleFnet,16,1.923421,33.082381,24.339341,2.123714,12.856360,6.053715,791,2,6,5,0,0,0 | |
cuda,GoogleFnet,16,1.897158,33.678000,25.597570,2.123300,12.856360,6.054895,791,2,6,5,0,0,0 | |
cuda,LayoutLMForMaskedLM,16,2.734762,25.898520,52.663815,2.043902,12.648872,6.188590,1497,2,6,5,0,0,0 | |
cuda,LayoutLMForMaskedLM,16,2.690863,26.289461,46.932117,2.044422,12.648872,6.187017,1497,2,6,5,0,0,0 | |
cuda,LayoutLMForMaskedLM,16,2.732458,25.852459,47.199227,2.044422,12.648872,6.187017,1497,2,6,5,0,0,0 | |
cuda,LayoutLMForMaskedLM,16,2.729872,25.802954,44.019661,2.044422,12.648872,6.187017,1497,2,6,5,0,0,0 | |
cuda,LayoutLMForMaskedLM,16,2.738789,25.788037,47.981004,2.044422,12.648872,6.187017,1497,2,6,5,0,0,0 | |
cuda,LayoutLMForMaskedLM,16,2.721155,25.968275,46.466488,2.044422,12.648872,6.187017,1497,2,6,5,0,0,0 | |
cuda,LayoutLMForSequenceClassification,16,2.898829,21.344006,78.566119,1.915030,9.843389,5.140070,1936,3,7,5,0,0,0 | |
cuda,LayoutLMForSequenceClassification,16,2.864214,21.580250,74.603807,1.914810,9.843389,5.140660,1936,3,7,5,0,0,0 | |
cuda,LayoutLMForSequenceClassification,16,2.946324,20.864058,69.597888,1.915030,9.843389,5.140070,1936,3,7,5,0,0,0 | |
cuda,LayoutLMForSequenceClassification,16,2.878415,21.366114,70.495472,1.914810,9.843389,5.140660,1936,3,7,5,0,0,0 | |
cuda,LayoutLMForSequenceClassification,16,2.905646,21.248846,73.756330,1.915030,9.843389,5.140070,1936,3,7,5,0,0,0 | |
cuda,LayoutLMForSequenceClassification,16,2.901617,21.250625,70.461364,1.914810,9.843389,5.140660,1936,3,7,5,0,0,0 | |
cuda,MobileBertForMaskedLM,128,2.579698,43.824341,98.913415,1.669544,14.059843,8.421369,1546,1,4,4,0,0,0 | |
cuda,MobileBertForMaskedLM,128,2.560593,43.755315,101.527214,1.669544,14.059843,8.421369,1546,1,4,4,0,0,0 | |
cuda,MobileBertForMaskedLM,128,2.544096,44.110358,95.394764,1.682058,14.059843,8.358717,1546,1,4,4,0,0,0 | |
cuda,MobileBertForMaskedLM,128,2.581275,43.873745,103.010425,1.682058,14.059843,8.358716,1546,1,4,4,0,0,0 | |
cuda,MobileBertForMaskedLM,128,2.554853,43.507945,92.950048,1.682058,14.059843,8.358717,1546,1,4,4,0,0,0 | |
cuda,MobileBertForMaskedLM,128,2.605591,41.523625,98.852894,1.682058,14.059843,8.358716,1546,1,4,4,0,0,0 | |
cuda,MobileBertForQuestionAnswering,128,2.990429,36.403690,96.236398,1.291882,8.091555,6.263383,1550,1,4,4,0,0,0 | |
cuda,MobileBertForQuestionAnswering,128,2.828594,34.247619,96.801123,1.302391,8.091555,6.212846,1550,1,4,4,0,0,0 | |
cuda,MobileBertForQuestionAnswering,128,2.889346,34.319027,87.981884,1.302391,8.091555,6.212846,1550,1,4,4,0,0,0 | |
cuda,MobileBertForQuestionAnswering,128,3.093854,32.528672,100.237272,1.302391,8.091555,6.212846,1550,1,4,4,0,0,0 | |
cuda,MobileBertForQuestionAnswering,128,2.894725,34.416331,93.237315,1.302391,8.091555,6.212846,1550,1,4,4,0,0,0 | |
cuda,MobileBertForQuestionAnswering,128,3.001292,35.797911,100.677535,1.302391,8.091555,6.212846,1550,1,4,4,0,0,0 | |
cuda,RobertaForQuestionAnswering,16,1.267716,26.395635,40.630853,1.087763,5.638196,5.183295,1354,2,6,5,0,0,0 | |
cuda,RobertaForQuestionAnswering,16,1.233684,26.728483,41.853530,1.087680,5.638196,5.183688,1354,2,6,5,0,0,0 | |
cuda,RobertaForQuestionAnswering,16,1.257918,26.399454,42.872596,1.087928,5.638196,5.182509,1354,2,6,5,0,0,0 | |
cuda,RobertaForQuestionAnswering,16,1.231518,26.605787,41.548511,1.087680,5.638196,5.183688,1354,2,6,5,0,0,0 | |
cuda,RobertaForQuestionAnswering,16,1.249526,26.160010,42.560193,1.087928,5.638196,5.182509,1354,2,6,5,0,0,0 | |
cuda,RobertaForQuestionAnswering,16,1.229170,26.228034,40.188131,1.087680,5.638196,5.183688,1354,2,6,5,0,0,0 | |
cuda,T5ForConditionalGeneration,4,1.536465,41.299229,58.679564,1.356455,8.785276,6.476642,1500,7,9,6,0,0,0 | |
cuda,T5ForConditionalGeneration,4,1.555096,40.760083,50.162359,1.356455,8.785276,6.476642,1500,7,9,6,0,0,0 | |
cuda,T5ForConditionalGeneration,4,1.528533,41.333984,54.146340,1.356455,8.785276,6.476642,1500,7,9,6,0,0,0 | |
cuda,T5ForConditionalGeneration,4,1.543496,41.083038,54.260598,1.356455,8.785276,6.476642,1500,7,9,6,0,0,0 | |
cuda,T5ForConditionalGeneration,4,1.530864,41.193400,54.557646,1.356455,8.785276,6.476642,1500,7,9,6,0,0,0 | |
cuda,T5ForConditionalGeneration,4,1.549753,41.090674,55.561973,1.356455,8.785276,6.476642,1500,7,9,6,0,0,0 |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment