GPU backend
Compare changes
- Praneet Rathi authored
test.jn deleted
100644 → 0
+ 0
− 752
fn Conv2d<t:number, m:usize, n:usize, p:usize, q:usize, r:usize, s:usize, u:usize, v:usize, w:usize, stride1:usize, stride2:usize, padding1:usize, padding2:usize, dilation1:usize, dilation2:usize, output_padding1:usize, output_padding2:usize, groups:usize>(X: t[m, n, p, q], W: t[r, n, s, u]) -> t[m, r, v, w] {
fn main(arg0_1: f32[32, 1, 3, 3], arg1_1: f32[32], arg2_1: f32[32], arg3_1: f32[32, 1, 3, 3], arg4_1: f32[32], arg5_1: f32[32], arg6_1: f32[16, 32, 1, 1], arg7_1: f32[16], arg8_1: f32[16], arg9_1: f32[96, 16, 1, 1], arg10_1: f32[96], arg11_1: f32[96], arg12_1: f32[96, 1, 3, 3], arg13_1: f32[96], arg14_1: f32[96], arg15_1: f32[24, 96, 1, 1], arg16_1: f32[24], arg17_1: f32[24], arg18_1: f32[144, 24, 1, 1], arg19_1: f32[144], arg20_1: f32[144], arg21_1: f32[144, 1, 3, 3], arg22_1: f32[144], arg23_1: f32[144], arg24_1: f32[24, 144, 1, 1], arg25_1: f32[24], arg26_1: f32[24], arg27_1: f32[144, 24, 1, 1], arg28_1: f32[144], arg29_1: f32[144], arg30_1: f32[144, 1, 3, 3], arg31_1: f32[144], arg32_1: f32[144], arg33_1: f32[32, 144, 1, 1], arg34_1: f32[32], arg35_1: f32[32], arg36_1: f32[192, 32, 1, 1], arg37_1: f32[192], arg38_1: f32[192], arg39_1: f32[192, 1, 3, 3], arg40_1: f32[192], arg41_1: f32[192], arg42_1: f32[32, 192, 1, 1], arg43_1: f32[32], arg44_1: f32[32], arg45_1: f32[192, 32, 1, 1], arg46_1: f32[192], arg47_1: f32[192], arg48_1: f32[192, 1, 3, 3], arg49_1: f32[192], arg50_1: f32[192], arg51_1: f32[32, 192, 1, 1], arg52_1: f32[32], arg53_1: f32[32], arg54_1: f32[192, 32, 1, 1], arg55_1: f32[192], arg56_1: f32[192], arg57_1: f32[192, 1, 3, 3], arg58_1: f32[192], arg59_1: f32[192], arg60_1: f32[64, 192, 1, 1], arg61_1: f32[64], arg62_1: f32[64], arg63_1: f32[384, 64, 1, 1], arg64_1: f32[384], arg65_1: f32[384], arg66_1: f32[384, 1, 3, 3], arg67_1: f32[384], arg68_1: f32[384], arg69_1: f32[64, 384, 1, 1], arg70_1: f32[64], arg71_1: f32[64], arg72_1: f32[384, 64, 1, 1], arg73_1: f32[384], arg74_1: f32[384], arg75_1: f32[384, 1, 3, 3], arg76_1: f32[384], arg77_1: f32[384], arg78_1: f32[64, 384, 1, 1], arg79_1: f32[64], arg80_1: f32[64], arg81_1: f32[384, 64, 1, 1], arg82_1: f32[384], arg83_1: f32[384], arg84_1: f32[384, 1, 3, 3], arg85_1: f32[384], arg86_1: f32[384], arg87_1: f32[64, 384, 1, 1], arg88_1: f32[64], arg89_1: f32[64], arg90_1: f32[384, 64, 1, 1], arg91_1: f32[384], arg92_1: f32[384], arg93_1: f32[384, 1, 3, 3], arg94_1: f32[384], arg95_1: f32[384], arg96_1: f32[96, 384, 1, 1], arg97_1: f32[96], arg98_1: f32[96], arg99_1: f32[576, 96, 1, 1], arg100_1: f32[576], arg101_1: f32[576], arg102_1: f32[576, 1, 3, 3], arg103_1: f32[576], arg104_1: f32[576], arg105_1: f32[96, 576, 1, 1], arg106_1: f32[96], arg107_1: f32[96], arg108_1: f32[576, 96, 1, 1], arg109_1: f32[576], arg110_1: f32[576], arg111_1: f32[576, 1, 3, 3], arg112_1: f32[576], arg113_1: f32[576], arg114_1: f32[96, 576, 1, 1], arg115_1: f32[96], arg116_1: f32[96], arg117_1: f32[576, 96, 1, 1], arg118_1: f32[576], arg119_1: f32[576], arg120_1: f32[576, 1, 3, 3], arg121_1: f32[576], arg122_1: f32[576], arg123_1: f32[160, 576, 1, 1], arg124_1: f32[160], arg125_1: f32[160], arg126_1: f32[960, 160, 1, 1], arg127_1: f32[960], arg128_1: f32[960], arg129_1: f32[960, 1, 3, 3], arg130_1: f32[960], arg131_1: f32[960], arg132_1: f32[160, 960, 1, 1], arg133_1: f32[160], arg134_1: f32[160], arg135_1: f32[960, 160, 1, 1], arg136_1: f32[960], arg137_1: f32[960], arg138_1: f32[960, 1, 3, 3], arg139_1: f32[960], arg140_1: f32[960], arg141_1: f32[160, 960, 1, 1], arg142_1: f32[160], arg143_1: f32[160], arg144_1: f32[960, 160, 1, 1], arg145_1: f32[960], arg146_1: f32[960], arg147_1: f32[960, 1, 3, 3], arg148_1: f32[960], arg149_1: f32[960], arg150_1: f32[320, 960, 1, 1], arg151_1: f32[320], arg152_1: f32[320], arg153_1: f32[1280, 320, 1, 1], arg154_1: f32[1280], arg155_1: f32[1280], arg156_1: f32[10, 1280], arg157_1: f32[10], arg158_1: f32[32], arg159_1: f32[32], arg160_1: i64[], arg161_1: f32[32], arg162_1: f32[32], arg163_1: i64[], arg164_1: f32[16], arg165_1: f32[16], arg166_1: i64[], arg167_1: f32[96], arg168_1: f32[96], arg169_1: i64[], arg170_1: f32[96], arg171_1: f32[96], arg172_1: i64[], arg173_1: f32[24], arg174_1: f32[24], arg175_1: i64[], arg176_1: f32[144], arg177_1: f32[144], arg178_1: i64[], arg179_1: f32[144], arg180_1: f32[144], arg181_1: i64[], arg182_1: f32[24], arg183_1: f32[24], arg184_1: i64[], arg185_1: f32[144], arg186_1: f32[144], arg187_1: i64[], arg188_1: f32[144], arg189_1: f32[144], arg190_1: i64[], arg191_1: f32[32], arg192_1: f32[32], arg193_1: i64[], arg194_1: f32[192], arg195_1: f32[192], arg196_1: i64[], arg197_1: f32[192], arg198_1: f32[192], arg199_1: i64[], arg200_1: f32[32], arg201_1: f32[32], arg202_1: i64[], arg203_1: f32[192], arg204_1: f32[192], arg205_1: i64[], arg206_1: f32[192], arg207_1: f32[192], arg208_1: i64[], arg209_1: f32[32], arg210_1: f32[32], arg211_1: i64[], arg212_1: f32[192], arg213_1: f32[192], arg214_1: i64[], arg215_1: f32[192], arg216_1: f32[192], arg217_1: i64[], arg218_1: f32[64], arg219_1: f32[64], arg220_1: i64[], arg221_1: f32[384], arg222_1: f32[384], arg223_1: i64[], arg224_1: f32[384], arg225_1: f32[384], arg226_1: i64[], arg227_1: f32[64], arg228_1: f32[64], arg229_1: i64[], arg230_1: f32[384], arg231_1: f32[384], arg232_1: i64[], arg233_1: f32[384], arg234_1: f32[384], arg235_1: i64[], arg236_1: f32[64], arg237_1: f32[64], arg238_1: i64[], arg239_1: f32[384], arg240_1: f32[384], arg241_1: i64[], arg242_1: f32[384], arg243_1: f32[384], arg244_1: i64[], arg245_1: f32[64], arg246_1: f32[64], arg247_1: i64[], arg248_1: f32[384], arg249_1: f32[384], arg250_1: i64[], arg251_1: f32[384], arg252_1: f32[384], arg253_1: i64[], arg254_1: f32[96], arg255_1: f32[96], arg256_1: i64[], arg257_1: f32[576], arg258_1: f32[576], arg259_1: i64[], arg260_1: f32[576], arg261_1: f32[576], arg262_1: i64[], arg263_1: f32[96], arg264_1: f32[96], arg265_1: i64[], arg266_1: f32[576], arg267_1: f32[576], arg268_1: i64[], arg269_1: f32[576], arg270_1: f32[576], arg271_1: i64[], arg272_1: f32[96], arg273_1: f32[96], arg274_1: i64[], arg275_1: f32[576], arg276_1: f32[576], arg277_1: i64[], arg278_1: f32[576], arg279_1: f32[576], arg280_1: i64[], arg281_1: f32[160], arg282_1: f32[160], arg283_1: i64[], arg284_1: f32[960], arg285_1: f32[960], arg286_1: i64[], arg287_1: f32[960], arg288_1: f32[960], arg289_1: i64[], arg290_1: f32[160], arg291_1: f32[160], arg292_1: i64[], arg293_1: f32[960], arg294_1: f32[960], arg295_1: i64[], arg296_1: f32[960], arg297_1: f32[960], arg298_1: i64[], arg299_1: f32[160], arg300_1: f32[160], arg301_1: i64[], arg302_1: f32[960], arg303_1: f32[960], arg304_1: i64[], arg305_1: f32[960], arg306_1: f32[960], arg307_1: i64[], arg308_1: f32[320], arg309_1: f32[320], arg310_1: i64[], arg311_1: f32[1280], arg312_1: f32[1280], arg313_1: i64[], arg314_1: f32[1, 1, 28, 28]) -> (f32[1, 10]) {