add zeropadding function

yester31 · Jul 23, 2021 · a3cbe88 · a3cbe88
1 parent 0395385
commit a3cbe88
Show file tree

Hide file tree

Showing 41 changed files with 523 additions and 8 deletions.
diff --git a/Calc_Validation/.idea/.gitignore b/Calc_Validation/.idea/.gitignore
diff --git a/Calc_Validation/.idea/Calc_Validation.iml b/Calc_Validation/.idea/Calc_Validation.iml
diff --git a/Calc_Validation/.idea/inspectionProfiles/profiles_settings.xml b/Calc_Validation/.idea/inspectionProfiles/profiles_settings.xml
diff --git a/Calc_Validation/.idea/misc.xml b/Calc_Validation/.idea/misc.xml
diff --git a/Calc_Validation/.idea/modules.xml b/Calc_Validation/.idea/modules.xml
diff --git a/Calc_Validation/.idea/vcs.xml b/Calc_Validation/.idea/vcs.xml
diff --git a/Calc_Validation/__pycache__/compare.cpython-37.pyc b/Calc_Validation/__pycache__/compare.cpython-37.pyc
diff --git a/Calc_Validation/compare.py b/Calc_Validation/compare.py
@@ -0,0 +1,26 @@
+
def compare_two_tensor(output, output_c):
    """Compare two flat tensors element by element and print a mismatch report.

    Every differing element is printed as it is found. At the end either a
    one-line summary (total count, mismatch count, and the element with the
    largest absolute difference) or a "perfect match" message is printed.

    Args:
        output: 1-D sequence of reference values (anything supporting ``len``
            and iteration, e.g. a list or a flattened NumPy array).
        output_c: 1-D sequence of values to check against ``output``.

    Raises:
        SystemExit: with status 1 when the two sequences differ in length.
    """
    if len(output) != len(output_c):
        print("Tensor size is not same : output=%d  output_c=%d" % (len(output), len(output_c)))
        # Exit with a failing status; the bare exit() builtin is only
        # installed by the `site` module and reported success (status 0).
        raise SystemExit(1)

    max_idx = -1
    max_diff = 0
    cnt_diff = 0
    r0 = 0
    r = 0
    for idx, (expected, actual) in enumerate(zip(output, output_c)):
        if expected != actual:
            cnt_diff += 1
            diff = abs(expected - actual)
            # Always record the first mismatch, so that a NaN difference
            # (which never compares greater than anything) is still reported.
            if max_idx < 0 or diff > max_diff:
                max_diff = diff
                max_idx = idx
                r0 = expected
                r = actual
            print("%6d output=%10.6f output_c=%10.6f diff=%.6f" % (idx, expected, actual, diff))
    # Decide on the mismatch count, not on max_diff: a NaN-only mismatch
    # leaves max_diff non-positive and used to be reported as a match.
    if cnt_diff > 0:
        print("cnt_total=%d cnt_diff=%d max_idx=%6d output=%10.6f output_c=%10.6f diff=%.6f" % (
            len(output), cnt_diff, max_idx, r0, r, max_diff))
    else:
        print("perfect match and done!")
diff --git a/Calc_Validation/tt.py → Calc_Validation/conv2d.py b/Calc_Validation/tt.py → Calc_Validation/conv2d.py
@@ -1,9 +1,10 @@
 import torch # v1.8.0
 import numpy as np
+from compare import *
 
-OC = 1
-IN = 1
-IC = 1
+OC = 3
+IN = 2
+IC = 2
 IH = 4
 IW = 4
 KH = 3
@@ -20,4 +21,9 @@
 conservertive_convolution.weight = torch.nn.Parameter(weight)
 
 output = conservertive_convolution(input)
-print(output)
+print(output)
+
+output_c = np.fromfile("../output/C_Tensor", dtype=np.float32)
+output_py = output.detach().numpy().flatten()
+
+compare_two_tensor(output_py, output_c)
diff --git a/Calc_Validation/conv2d_with_padding.py b/Calc_Validation/conv2d_with_padding.py
@@ -0,0 +1,37 @@
import torch # v1.8.0
import numpy as np
from compare import *

# Reference (PyTorch) computation of a zero-padded 2-D convolution whose
# result is compared against the binary dump written by the C++ program.

# Tensor geometry: output channels, batch size, input channels,
# input height/width, kernel height/width.
OC = 3
IN = 2
IC = 2
IH = 4
IW = 4
KH = 3
KW = 3
# Asymmetric zero padding: top, bottom, left, right.
TP = 1
BP = 2
LP = 3
RP = 4

# All-ones kernel of shape [OC, IC, KH, KW].
weight = torch.ones([OC, IC, KH, KW], dtype=torch.float32, requires_grad=False)
print(weight)

# Input filled with 1, 2, 3, ... in [IN, IC, IH, IW] order.
input_np = np.arange(1, IN * IC * IH * IW + 1).reshape(IN, IC, IH, IW)
input_tensor = torch.from_numpy(input_np).type(torch.FloatTensor)
print(input_tensor)

# torch.nn.functional.pad takes the padding for the last dimension first:
# (left, right, top, bottom).
p2d = (LP, RP, TP, BP)
input_padded = torch.nn.functional.pad(input_tensor, p2d, "constant", 0)
print(input_padded)

# kernel_size is (height, width); it was (KH, KH), which only worked
# because the kernel happens to be square here.
conservertive_convolution = torch.nn.Conv2d(IC, OC, (KH, KW), stride=(1, 1), bias=False)
conservertive_convolution.weight = torch.nn.Parameter(weight)

output = conservertive_convolution(input_padded)
print(output)

# Load the raw float32 dump and compare it with the flattened PyTorch result.
output_c = np.fromfile("../output/C_Tensor_zp", dtype=np.float32)
output_py = output.detach().numpy().flatten()

compare_two_tensor(output_py, output_c)
diff --git a/Conservertive_Convolution/.vs/Conservertive_Convolution/v15/.suo b/Conservertive_Convolution/.vs/Conservertive_Convolution/v15/.suo
diff --git a/Conservertive_Convolution/.vs/Conservertive_Convolution/v15/Browse.VC.db b/Conservertive_Convolution/.vs/Conservertive_Convolution/v15/Browse.VC.db
diff --git a/Conservertive_Convolution/Conservertive_Convolution/Conservertive_Convolution.cpp b/Conservertive_Convolution/Conservertive_Convolution/Conservertive_Convolution.cpp
@@ -100,7 +100,7 @@ void scalarTensor(vector<float>& output, int OC, int IC, int KH, int KW, float s
 	}
 }
 
-void tofile(vector<float> &Buffer, string fname = "C_Tensor") {
+void tofile(vector<float> &Buffer, string fname = "../../output/C_Tensor") {
 	std::ofstream fs(fname, ios::binary);
 	if (fs.is_open())
 		fs.write((const char*)Buffer.data(), Buffer.size() * sizeof(float));
@@ -109,9 +109,9 @@ void tofile(vector<float> &Buffer, string fname = "C_Tensor") {
 
 int main()
 {
-	int OC = 1;
-	int IC = 1;
-	int IN = 1;
+	int OC = 3;
+	int IC = 2;
+	int IN = 2;
 	int IH = 4;
 	int IW = 4;
 	int KH = 3;

diff --git a/...e_Convolution/Conservertive_Convolution/x64/Debug/Conserve.8C10F35D.tlog/link.read.1.tlog b/...e_Convolution/Conservertive_Convolution/x64/Debug/Conserve.8C10F35D.tlog/link.read.1.tlog
diff --git a/Conservertive_Convolution/Conservertive_Convolution/x64/Debug/vc141.idb b/Conservertive_Convolution/Conservertive_Convolution/x64/Debug/vc141.idb
diff --git a/Conservertive_Convolution/Conservertive_Convolution/x64/Debug/vc141.pdb b/Conservertive_Convolution/Conservertive_Convolution/x64/Debug/vc141.pdb
diff --git a/Conservertive_Convolution/x64/Debug/Conservertive_Convolution.ilk b/Conservertive_Convolution/x64/Debug/Conservertive_Convolution.ilk
diff --git a/Conservertive_Convolution/x64/Debug/Conservertive_Convolution.pdb b/Conservertive_Convolution/x64/Debug/Conservertive_Convolution.pdb
diff --git a/Conservertive_Convolution_with_padding/.vs/Conservertive_Convolution_with_padding/v15/.suo b/Conservertive_Convolution_with_padding/.vs/Conservertive_Convolution_with_padding/v15/.suo
diff --git a/...tive_Convolution_with_padding/.vs/Conservertive_Convolution_with_padding/v15/Browse.VC.db b/...tive_Convolution_with_padding/.vs/Conservertive_Convolution_with_padding/v15/Browse.VC.db
diff --git a/...ith_padding/v15/ipch/AutoPCH/cf6205ca1d479a70/CONSERVERTIVE_CONVOLUTION_WITH_PADDING.ipch b/...ith_padding/v15/ipch/AutoPCH/cf6205ca1d479a70/CONSERVERTIVE_CONVOLUTION_WITH_PADDING.ipch
diff --git a/Conservertive_Convolution_with_padding/Conservertive_Convolution_with_padding.sln b/Conservertive_Convolution_with_padding/Conservertive_Convolution_with_padding.sln
@@ -0,0 +1,31 @@
+
+Microsoft Visual Studio Solution File, Format Version 12.00
+# Visual Studio 15
+VisualStudioVersion = 15.0.28307.1209
+MinimumVisualStudioVersion = 10.0.40219.1
+Project("{8BC9CEB8-8B4A-11D0-8D11-00A0C91BC942}") = "Conservertive_Convolution_with_padding", "Conservertive_Convolution_with_padding\Conservertive_Convolution_with_padding.vcxproj", "{4833BF3A-1547-4A3C-A1A6-5C952F174486}"
+EndProject
+Global
+	GlobalSection(SolutionConfigurationPlatforms) = preSolution
+		Debug|x64 = Debug|x64
+		Debug|x86 = Debug|x86
+		Release|x64 = Release|x64
+		Release|x86 = Release|x86
+	EndGlobalSection
+	GlobalSection(ProjectConfigurationPlatforms) = postSolution
+		{4833BF3A-1547-4A3C-A1A6-5C952F174486}.Debug|x64.ActiveCfg = Debug|x64
+		{4833BF3A-1547-4A3C-A1A6-5C952F174486}.Debug|x64.Build.0 = Debug|x64
+		{4833BF3A-1547-4A3C-A1A6-5C952F174486}.Debug|x86.ActiveCfg = Debug|Win32
+		{4833BF3A-1547-4A3C-A1A6-5C952F174486}.Debug|x86.Build.0 = Debug|Win32
+		{4833BF3A-1547-4A3C-A1A6-5C952F174486}.Release|x64.ActiveCfg = Release|x64
+		{4833BF3A-1547-4A3C-A1A6-5C952F174486}.Release|x64.Build.0 = Release|x64
+		{4833BF3A-1547-4A3C-A1A6-5C952F174486}.Release|x86.ActiveCfg = Release|Win32
+		{4833BF3A-1547-4A3C-A1A6-5C952F174486}.Release|x86.Build.0 = Release|Win32
+	EndGlobalSection
+	GlobalSection(SolutionProperties) = preSolution
+		HideSolutionNode = FALSE
+	EndGlobalSection
+	GlobalSection(ExtensibilityGlobals) = postSolution
+		SolutionGuid = {69E503E3-64A0-4840-AD53-1D5332013285}
+	EndGlobalSection
+EndGlobal
diff --git a/...padding/Conservertive_Convolution_with_padding/Conservertive_Convolution_with_padding.cpp b/...padding/Conservertive_Convolution_with_padding/Conservertive_Convolution_with_padding.cpp
@@ -0,0 +1,187 @@
+// 2021-7-22 by YH PARK
+
+#include <iostream>
+#include <string>
+#include <vector>
+#include <random>
+#include <chrono>
+#include <iomanip>
+#include<fstream>
+using namespace std;
+using namespace chrono;
+
+/***************************************************************************
+	Conservertive Convolution algorithm (with zero-padding option)
+****************************************************************************/
+
/**
 * Copies an NCHW tensor into a larger NCHW tensor, surrounding every
 * IH x IW plane with a zero border.
 *
 * @param output Destination buffer. It is grown if it holds fewer than
 *               IN * IC * (IH+TP+BP) * (IW+LP+RP) elements; exactly that
 *               many leading elements are overwritten. Elements beyond
 *               that range are left untouched.
 * @param input  Source buffer holding at least IN * IC * IH * IW elements.
 * @param IN     Batch size.
 * @param IC     Number of channels.
 * @param IH     Input height.
 * @param IW     Input width.
 * @param TP     Rows of zeros added above each plane.
 * @param BP     Rows of zeros added below each plane.
 * @param LP     Columns of zeros added to the left of each plane.
 * @param RP     Columns of zeros added to the right of each plane.
 *
 * On an invalid request (negative padding or a too-small input buffer) a
 * message is written to std::cerr and output is left unmodified.
 */
void zeroPadding(std::vector<float>& output, const std::vector<float>& input, int IN, int IC, int IH, int IW, int TP, int BP, int LP, int RP) {
	std::cout << "===== Zero Padding ===== \n";

	// Nothing to copy for an empty tensor.
	if (IN <= 0 || IC <= 0 || IH <= 0 || IW <= 0) {
		return;
	}
	if (TP < 0 || BP < 0 || LP < 0 || RP < 0) {
		std::cerr << "zeroPadding: padding sizes must be non-negative" << std::endl;
		return;
	}

	const std::size_t planes = static_cast<std::size_t>(IN) * static_cast<std::size_t>(IC);
	const std::size_t in_h = static_cast<std::size_t>(IH);
	const std::size_t in_w = static_cast<std::size_t>(IW);
	const std::size_t out_h = in_h + static_cast<std::size_t>(TP) + static_cast<std::size_t>(BP);
	const std::size_t out_w = in_w + static_cast<std::size_t>(LP) + static_cast<std::size_t>(RP);
	const std::size_t in_total = planes * in_h * in_w;
	const std::size_t out_total = planes * out_h * out_w;

	if (input.size() < in_total) {
		std::cerr << "zeroPadding: input buffer is smaller than IN*IC*IH*IW" << std::endl;
		return;
	}
	if (output.size() < out_total) {
		output.resize(out_total);
	}

	// Write the border explicitly instead of trusting the caller to have
	// zero-initialised the destination.
	for (std::size_t i = 0; i < out_total; ++i) {
		output[i] = 0.f;
	}

	// Batch and channel share the same layout in both tensors, so they can be
	// walked as one flat "plane" index.
	for (std::size_t plane = 0; plane < planes; ++plane) {
		const float* src_plane = input.data() + plane * in_h * in_w;
		float* dst_plane = output.data() + plane * out_h * out_w;
		for (std::size_t row = 0; row < in_h; ++row) {
			const float* src = src_plane + row * in_w;
			// Shift the row down by TP and right by LP inside the padded plane.
			float* dst = dst_plane + (row + static_cast<std::size_t>(TP)) * out_w + static_cast<std::size_t>(LP);
			for (std::size_t col = 0; col < in_w; ++col) {
				dst[col] = src[col];
			}
		}
	}
}
+
+
/**
 * Direct (naive) 2-D convolution over NCHW tensors without padding.
 *
 * For every batch item and output channel, the per-input-channel window
 * sums are ADDED to output. The destination must therefore hold zeros (or
 * any value that should be accumulated onto) before the call.
 *
 * @param output Destination of shape [IN][OC][OH][OW] with
 *               OH = (IH - KH) / stride + 1 and OW = (IW - KW) / stride + 1.
 *               Grown with zero-filled elements if it is too small.
 * @param input  Source of shape [IN][IC][IH][IW].
 * @param weight Kernel of shape [OC][IC][KH][KW].
 * @param KH     Kernel height.
 * @param KW     Kernel width.
 * @param stride Step between neighbouring windows (same in both directions).
 * @param IN     Batch size.
 * @param IC     Number of input channels.
 * @param IH     Input height.
 * @param IW     Input width.
 * @param OC     Number of output channels.
 *
 * On an invalid request (non-positive stride or kernel size, kernel larger
 * than the input, undersized input or weight buffer) a message is written
 * to std::cerr and output is left unmodified.
 */
void convolution(std::vector<float>& output, const std::vector<float>& input, const std::vector<float>& weight, int KH, int KW, int stride, int IN, int IC, int IH, int IW, int OC) {
	std::cout << "===== Convolution ===== \n" << std::endl;

	// Empty tensors: nothing to compute.
	if (IN <= 0 || IC <= 0 || OC <= 0) {
		return;
	}
	if (stride <= 0 || KH <= 0 || KW <= 0) {
		std::cerr << "convolution: stride and kernel size must be positive" << std::endl;
		return;
	}
	if (KH > IH || KW > IW) {
		std::cerr << "convolution: kernel is larger than the input" << std::endl;
		return;
	}

	const int OH = ((IH - KH) / stride) + 1;
	const int OW = ((IW - KW) / stride) + 1;

	const std::size_t in_plane_size = static_cast<std::size_t>(IH) * static_cast<std::size_t>(IW);
	const std::size_t out_plane_size = static_cast<std::size_t>(OH) * static_cast<std::size_t>(OW);
	const std::size_t kernel_plane_size = static_cast<std::size_t>(KH) * static_cast<std::size_t>(KW);

	const std::size_t in_total = static_cast<std::size_t>(IN) * static_cast<std::size_t>(IC) * in_plane_size;
	const std::size_t out_total = static_cast<std::size_t>(IN) * static_cast<std::size_t>(OC) * out_plane_size;
	const std::size_t kernel_total = static_cast<std::size_t>(OC) * static_cast<std::size_t>(IC) * kernel_plane_size;

	if (input.size() < in_total || weight.size() < kernel_total) {
		std::cerr << "convolution: input or weight buffer is smaller than its declared shape" << std::endl;
		return;
	}
	if (output.size() < out_total) {
		output.resize(out_total);  // new elements are value-initialised to 0
	}

	for (int n = 0; n < IN; ++n) {
		for (int oc = 0; oc < OC; ++oc) {
			float* out_plane = output.data()
				+ (static_cast<std::size_t>(n) * static_cast<std::size_t>(OC) + static_cast<std::size_t>(oc)) * out_plane_size;
			for (int ic = 0; ic < IC; ++ic) {
				const float* in_plane = input.data()
					+ (static_cast<std::size_t>(n) * static_cast<std::size_t>(IC) + static_cast<std::size_t>(ic)) * in_plane_size;
				const float* kernel = weight.data()
					+ (static_cast<std::size_t>(oc) * static_cast<std::size_t>(IC) + static_cast<std::size_t>(ic)) * kernel_plane_size;
				for (int oh = 0; oh < OH; ++oh) {
					for (int ow = 0; ow < OW; ++ow) {
						float sum = 0;
						for (int ky = 0; ky < KH; ++ky) {
							const float* in_row = in_plane + (oh * stride + ky) * IW + ow * stride;
							// A kernel row is KW elements wide; the original
							// multiplied by KH here, which is only correct
							// for square kernels.
							const float* kernel_row = kernel + ky * KW;
							for (int kx = 0; kx < KW; ++kx) {
								sum += in_row[kx] * kernel_row[kx];
							}
						}
						// Accumulate this input channel's contribution.
						out_plane[oh * OW + ow] += sum;
					}
				}
			}
		}
	}
}
+
+
/**
 * Prints an NCHW tensor to std::cout, one image row per line, each value
 * right-aligned in a 5-character field and followed by a space. Every
 * channel plane is followed by two blank lines.
 *
 * @param Input Tensor data holding at least IN * IC * IH * IW elements
 *              (IC * IH * IW when one is true).
 * @param IN    Batch size.
 * @param IC    Number of channels.
 * @param IH    Plane height.
 * @param IW    Plane width.
 * @param one   When true, only the first batch item is printed.
 *
 * If Input is smaller than the requested shape, a message is written to
 * std::cerr and nothing beyond the header is printed.
 */
void valueCheck(const std::vector<float>& Input, int IN, int IC, int IH, int IW, bool one = false) {
	std::cout << "===== valueCheck func =====" << std::endl;
	if (one) IN = 1;

	// Nothing to print for an empty batch or channel dimension.
	if (IN <= 0 || IC <= 0) {
		return;
	}

	const std::size_t rows = IH > 0 ? static_cast<std::size_t>(IH) : 0;
	const std::size_t cols = IW > 0 ? static_cast<std::size_t>(IW) : 0;
	const std::size_t planes = static_cast<std::size_t>(IN) * static_cast<std::size_t>(IC);
	if (Input.size() < planes * rows * cols) {
		std::cerr << "valueCheck: tensor holds fewer elements than the requested shape" << std::endl;
		return;
	}

	std::size_t idx = 0;  // elements are stored contiguously in print order
	for (std::size_t plane = 0; plane < planes; ++plane) {
		for (std::size_t r = 0; r < rows; ++r) {
			for (std::size_t c = 0; c < cols; ++c) {
				std::cout << std::setw(5) << Input[idx++] << " ";
			}
			std::cout << '\n';
		}
		std::cout << "\n\n";
	}
	// Flush once at the end instead of after every row.
	std::cout << std::flush;
}
+
/**
 * Fills a tensor of shape [OC][IC][KH][KW] with an arithmetic sequence.
 *
 * The running value is incremented by step BEFORE each store, so the first
 * element receives start + step. With the defaults every element is 1.
 *
 * @param output Destination buffer; grown if it holds fewer than
 *               OC * IC * KH * KW elements. Elements beyond that range are
 *               left untouched.
 * @param OC     Size of the outermost dimension.
 * @param IC     Size of the second dimension.
 * @param KH     Size of the third dimension.
 * @param KW     Size of the innermost dimension.
 * @param start  Value the sequence starts from (before the first increment).
 * @param step   Increment applied before each element is written.
 */
void scalarTensor(std::vector<float>& output, int OC, int IC, int KH, int KW, float start = 1.f, int step = 0) {
	std::cout << "===== scalarTensor func =====" << std::endl;
	std::cout << "Tensor[" << OC << "][" << IC << "][" << KH << "][" << KW << "]" << std::endl << std::endl;

	// An empty dimension means there is nothing to fill.
	if (OC <= 0 || IC <= 0 || KH <= 0 || KW <= 0) {
		return;
	}

	const std::size_t total = static_cast<std::size_t>(OC) * static_cast<std::size_t>(IC)
		* static_cast<std::size_t>(KH) * static_cast<std::size_t>(KW);
	if (output.size() < total) {
		output.resize(total);
	}

	// The tensor is contiguous, so the four nested loops collapse into a
	// single linear walk in the same element order.
	float value = start;
	for (std::size_t i = 0; i < total; ++i) {
		value += step;
		output[i] = value;
	}
}
+
/**
 * Writes the raw bytes of a float buffer to a binary file.
 *
 * @param Buffer Values to dump; written back-to-back with no header, in the
 *               machine's native float representation.
 * @param fname  Destination path; the file is created or truncated.
 *
 * The success message is printed only when the file was opened and fully
 * written. Otherwise an error is reported on std::cerr.
 */
void tofile(const std::vector<float>& Buffer, const std::string& fname = "../../output/C_Tensor") {
	std::ofstream fs(fname, std::ios::binary);
	if (!fs.is_open()) {
		std::cerr << "failed to open output file: " << fname << std::endl;
		return;
	}

	fs.write(reinterpret_cast<const char*>(Buffer.data()),
		static_cast<std::streamsize>(Buffer.size() * sizeof(float)));
	fs.close();
	// close() flushes; a failed flush or write leaves the stream in a bad state.
	if (!fs) {
		std::cerr << "failed to write output file: " << fname << std::endl;
		return;
	}
	std::cout << "the output file produced in output folder." << std::endl;
}
+
+int main()
+{
+	int OC = 3;
+	int IC = 2;
+	int IN = 2;
+	int IH = 4;
+	int IW = 4;
+	int KH = 3;
+	int KW = 3;
+	int TP = 1;
+	int BP = 2;
+	int LP = 3;
+	int RP = 4;
+
+	// weight[OC][lC][KH][KW] 
+	// 임시 weight 값 
+	vector<float> weight(OC * IC * KH * KW);
+	scalarTensor(weight, OC, IC, KH, KW);
+	valueCheck(weight, OC, IC, KH, KW, 1);
+
+	// d[IN][IC][IH][IW] 
+	// 임시 input 값 
+	vector<float> input(IN * IC * IH * IW);
+	scalarTensor(input, IN, IC, IH, IW, 0, 1);
+	valueCheck(input, IN, IC, IH, IW, 1);
+
+	int stride = 1;
+	int OH = ((IH + TP + BP - KH) / stride) + 1;
+	int OW = ((IW + LP + RP - KW) / stride) + 1;
+
+	vector<float> output(IN * OC * OH * OW);
+	vector<float> output_zeropadding(IN * OC * (IH + TP + BP) * (IW + LP + RP));
+
+	long long start_usec3 = duration_cast<microseconds>(system_clock::now().time_since_epoch()).count();
+
+	zeroPadding(output_zeropadding, input, IN, IC, IH, IW, TP, BP, LP, RP);
+	valueCheck(output_zeropadding, IN, IC, (IH + TP + BP) , (IW + LP + RP));
+
+	convolution(output, output_zeropadding, weight, KH, KW, stride, IN, IC, (IH + TP + BP), (IW + LP + RP), OC);
+	valueCheck(output, IN, OC, OH, OW);
+
+	long long end_usec3 = duration_cast<microseconds>(system_clock::now().time_since_epoch()).count();
+	int frame_sec3 = int(end_usec3 - start_usec3);
+
+	std::cout << "======================================================" << std::endl;
+	std::cout << "dur time :: " << frame_sec3 << " [micro sec]" << std::endl;
+	tofile(output, "../../output/C_Tensor_zp");
+}
+