Skip to content
Snippets Groups Projects
Commit 8db8c1eb authored by Hashim Sharif
Browse files

removing more unused commented code

parent 6e70be1c
No related branches found
No related tags found
No related merge requests found
...@@ -471,33 +471,15 @@ void sampleFilter2(Tensor* newFilter, Tensor* filter, ...@@ -471,33 +471,15 @@ void sampleFilter2(Tensor* newFilter, Tensor* filter,
int N = n * c * h * w; int N = n * c * h * w;
float mul_factor; float mul_factor;
/*if (interpolation_id == 0){
mul_factor = (skip_rate * 1.0) / (skip_rate - 1);
}
else if (interpolation_id == 1){
mul_factor = (skip_rate * 1.0) / (skip_rate - 1);
mul_factor = (mul_factor + 1.0) / 2;
}
*/
//printf ("interpolation_rate = %f \n", interpolation_rate);
mul_factor = (skip_rate * 1.0) / (skip_rate - 1); mul_factor = (skip_rate * 1.0) / (skip_rate - 1);
mul_factor = 1 + (interpolation_rate * (mul_factor - 1.0)); mul_factor = 1 + (interpolation_rate * (mul_factor - 1.0));
printf ("mul_factor = %f \n", mul_factor);
DEBUG ("mul_factor = %f \n", mul_factor); DEBUG ("mul_factor = %f \n", mul_factor);
sampleFilterElems<<<numBlocks,128>>>(N, sampleFilterElems<<<numBlocks,128>>>(N,
n, c, h, w, n, c, h, w,
(float *) filter->gpu_data, (float *) filter->gpu_data,
skip_rate, skip_offset, mul_factor, skip_rate, skip_offset, mul_factor,
(float *) newFilter->gpu_data); (float *) newFilter->gpu_data);
} }
...@@ -943,6 +925,8 @@ int getSwing(int swing){ ...@@ -943,6 +925,8 @@ int getSwing(int swing){
void initializeAutotuner(){ void initializeAutotuner(){
printf("initializing tuner .... \n");
sampParamSet = new SampParamSet; sampParamSet = new SampParamSet;
perfParamSet = new PerfParamSet; perfParamSet = new PerfParamSet;
} }
......
...@@ -240,42 +240,5 @@ void hgemm(const float * const __restrict__ af, ...@@ -240,42 +240,5 @@ void hgemm(const float * const __restrict__ af,
} }
/*int main() {
const unsigned num_rows_a = 5000 * 14 * 14;
const unsigned num_cols_a = 800;
const unsigned num_rows_b = num_cols_a;
const unsigned num_cols_b = 64;
const unsigned num_elements_a = num_rows_a * num_cols_a;
const unsigned num_elements_b = num_rows_b * num_cols_b;
const unsigned num_elements_c = num_rows_a * num_cols_b;
float *a;
float *b;
float *c;
checkCuda(cudaMallocManaged(&a, sizeof(float) * num_elements_a));
checkCuda(cudaMallocManaged(&b, sizeof(float) * num_elements_b));
checkCuda(cudaMallocManaged(&c, sizeof(float) * num_elements_c));
init(a, num_elements_a);
init(b, num_elements_b);
init(c, num_elements_c);
// FP32
sgemm(a, num_rows_a, num_cols_a, b, num_rows_b, num_cols_b, c);
printArray(c, 16);
// FP16
hgemm(a, num_rows_a, num_cols_a, b, num_rows_b, num_cols_b, c);
printArray(c, 16);
checkCuda(cudaFree(a));
checkCuda(cudaFree(b));
checkCuda(cudaFree(c));
return 0;
}
*/
#endif #endif
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment