AllentDan
diff --git a/‎lesson6-Segmentation/ResNet.cpp
Lines changed: 240 additions & 0 deletions b/‎lesson6-Segmentation/ResNet.cpp
Lines changed: 240 additions & 0 deletions
diff --git a/‎lesson6-Segmentation/ResNet.h
Lines changed: 65 additions & 0 deletions b/‎lesson6-Segmentation/ResNet.h
Lines changed: 65 additions & 0 deletions
@@ -0,0 +1,240 @@
+#include "ResNet.h"
+
+/// Builds one residual block.
+///
+/// When `_is_basic` is true the block holds two 3x3 convolutions (conv1/bn1,
+/// conv2/bn2). Otherwise it holds a 1x1 -> 3x3 -> 1x1 stack whose last
+/// convolution outputs `planes * 4` channels (conv3/bn3).
+///
+/// @param inplanes     channel count passed to the first convolution
+/// @param planes       base channel count of the block
+/// @param stride_      stride given to the strided 3x3 convolution
+/// @param downsample_  module applied to the shortcut branch; a null holder or
+///                     an empty Sequential means "no projection"
+/// @param groups       group count given to the 3x3 convolutions
+/// @param base_width   scales the internal width as planes * base_width / 64
+/// @param _is_basic    selects the two-convolution layout when true
+BlockImpl::BlockImpl(int64_t inplanes, int64_t planes, int64_t stride_,
+    torch::nn::Sequential downsample_, int groups, int base_width, bool _is_basic)
+{
+    downsample = downsample_;
+    // The declaration defaults `downsample_` to nullptr. Dereferencing a null
+    // holder throws, so replace it with an empty Sequential that the
+    // `downsample->is_empty()` checks can query safely.
+    if (downsample.is_empty()) {
+        downsample = torch::nn::Sequential();
+    }
+    stride = stride_;
+    is_basic = _is_basic;
+    const int width = int(planes * (base_width / 64.)) * groups;
+
+    // Each layer is constructed exactly once for the selected layout.
+    if (is_basic) {
+        conv1 = torch::nn::Conv2d(conv_options(inplanes, width, 3, stride_, 1, groups, false));
+        conv2 = torch::nn::Conv2d(conv_options(width, width, 3, 1, 1, groups, false));
+    }
+    else {
+        conv1 = torch::nn::Conv2d(conv_options(inplanes, width, 1, 1, 0, 1, false));
+        conv2 = torch::nn::Conv2d(conv_options(width, width, 3, stride_, 1, groups, false));
+        conv3 = torch::nn::Conv2d(conv_options(width, planes * 4, 1, 1, 0, 1, false));
+        bn3 = torch::nn::BatchNorm2d(torch::nn::BatchNorm2dOptions(planes * 4));
+    }
+    bn1 = torch::nn::BatchNorm2d(torch::nn::BatchNorm2dOptions(width));
+    bn2 = torch::nn::BatchNorm2d(torch::nn::BatchNorm2dOptions(width));
+
+    // Registration order is kept (conv1, bn1, conv2, bn2, conv3, bn3,
+    // downsample) so parameter names and ordering stay the same.
+    register_module("conv1", conv1);
+    register_module("bn1", bn1);
+    register_module("conv2", conv2);
+    register_module("bn2", bn2);
+    if (!is_basic) {
+        register_module("conv3", conv3);
+        register_module("bn3", bn3);
+    }
+
+    if (!downsample->is_empty()) {
+        register_module("downsample", downsample);
+    }
+}
+
+/// Runs the block: convolution stack plus shortcut, followed by ReLU.
+///
+/// @param x  input tensor
+/// @return   relu(stack(x) + shortcut(x)), where shortcut is `downsample` when
+///           one is present and the identity otherwise
+torch::Tensor BlockImpl::forward(torch::Tensor x) {
+    // Sharing the handle is enough: every step below assigns a new tensor to
+    // `x`, and the only in-place op (`+=`) writes to the stack output, never
+    // to the block input. A clone would only cost memory.
+    torch::Tensor residual = x;
+
+    x = torch::relu(bn1->forward(conv1->forward(x)));
+    x = bn2->forward(conv2->forward(x));
+
+    if (!is_basic) {
+        x = bn3->forward(conv3->forward(torch::relu(x)));
+    }
+
+    // Check the holder itself first: dereferencing a null holder throws.
+    if (!downsample.is_empty() && !downsample->is_empty()) {
+        residual = downsample->forward(residual);
+    }
+
+    x += residual;
+    return torch::relu(x);
+}
+
+/// Builds the network: a 7x7 stem convolution with batch norm, four residual
+/// stages, and a linear classifier.
+///
+/// @param layers            number of blocks per stage; the first four entries
+///                          are used
+/// @param num_classes       output size of the final linear layer
+/// @param model_type        "resnet18" and "resnet34" select the basic block
+///                          (expansion 1); any other value selects the
+///                          three-convolution block (expansion 4)
+/// @param _groups           group count forwarded to every block
+/// @param _width_per_group  base width forwarded to every block
+ResNetImpl::ResNetImpl(std::vector<int> layers, int num_classes, std::string model_type, int _groups, int _width_per_group)
+{
+    // layers[0..3] are indexed below; fail loudly instead of reading past the
+    // end of a short vector.
+    TORCH_CHECK(layers.size() >= 4,
+        "ResNet needs a block count for each of its 4 stages, got ", layers.size());
+
+    if (model_type != "resnet18" && model_type != "resnet34")
+    {
+        expansion = 4;
+        is_basic = false;
+    }
+    groups = _groups;
+    base_width = _width_per_group;
+
+    conv1 = torch::nn::Conv2d(conv_options(3, 64, 7, 2, 3, 1, false));
+    bn1 = torch::nn::BatchNorm2d(torch::nn::BatchNorm2dOptions(64));
+    // _make_layer updates `inplanes`, so the stages must be built in order.
+    layer1 = torch::nn::Sequential(_make_layer(64, layers[0]));
+    layer2 = torch::nn::Sequential(_make_layer(128, layers[1], 2));
+    layer3 = torch::nn::Sequential(_make_layer(256, layers[2], 2));
+    layer4 = torch::nn::Sequential(_make_layer(512, layers[3], 2));
+    fc = torch::nn::Linear(512 * expansion, num_classes);
+
+    register_module("conv1", conv1);
+    register_module("bn1", bn1);
+    register_module("layer1", layer1);
+    register_module("layer2", layer2);
+    register_module("layer3", layer3);
+    register_module("layer4", layer4);
+    register_module("fc", fc);
+}
+
+
+/// Classification forward pass.
+///
+/// @param x  input tensor fed to the stem convolution
+/// @return   log-softmax over dimension 1 of the classifier output
+torch::Tensor  ResNetImpl::forward(torch::Tensor x) {
+    x = torch::relu(bn1->forward(conv1->forward(x)));
+    x = torch::max_pool2d(x, 3, 2, 1);
+
+    x = layer1->forward(x);
+    x = layer2->forward(x);
+    x = layer3->forward(x);
+    x = layer4->forward(x);
+
+    // Pool to 1x1 whatever the spatial size is. A fixed 7x7 window only
+    // collapses a 7x7 map; any other size either fails or leaves a map that
+    // no longer matches the fc input width. On a 7x7 map the result is the same.
+    x = torch::adaptive_avg_pool2d(x, { 1, 1 });
+    x = x.view({ x.size(0), -1 });
+    x = fc->forward(x);
+
+    return torch::log_softmax(x, 1);
+}
+
+/// Collects intermediate activations.
+///
+/// @param x  input tensor
+/// @return   six tensors in order: the input itself, the stem output after
+///           ReLU (before max-pooling), then the outputs of layer1..layer4
+std::vector<torch::Tensor> ResNetImpl::features(torch::Tensor x){
+    std::vector<torch::Tensor> collected;
+    collected.push_back(x);
+
+    // Stem: the activation is recorded before the max-pool is applied.
+    x = torch::relu(bn1->forward(conv1->forward(x)));
+    collected.push_back(x);
+    x = torch::max_pool2d(x, 3, 2, 1);
+
+    // Residual stages, each output recorded in turn.
+    torch::nn::Sequential* stages[] = { &layer1, &layer2, &layer3, &layer4 };
+    for (torch::nn::Sequential* stage : stages) {
+        x = (*stage)->forward(x);
+        collected.push_back(x);
+    }
+
+    return collected;
+}
+
+/// Assembles one stage of `blocks` residual blocks.
+///
+/// The first block receives `stride` and, when the stride is not 1 or the
+/// channel count changes, a 1x1 convolution + batch norm on the shortcut. The
+/// remaining blocks use stride 1 and an empty shortcut module.
+/// Side effect: sets `inplanes` to `planes * expansion`.
+torch::nn::Sequential ResNetImpl::_make_layer(int64_t planes, int64_t blocks, int64_t stride) {
+    const bool shape_preserved = (stride == 1) && (inplanes == planes * expansion);
+
+    torch::nn::Sequential shortcut;
+    if (!shape_preserved) {
+        shortcut = torch::nn::Sequential(
+            torch::nn::Conv2d(conv_options(inplanes, planes * expansion, 1, stride, 0, 1, false)),
+            torch::nn::BatchNorm2d(planes * expansion)
+        );
+    }
+
+    torch::nn::Sequential stage;
+    stage->push_back(Block(inplanes, planes, stride, shortcut, groups, base_width, is_basic));
+
+    // Every following block consumes the expanded channel count.
+    inplanes = planes * expansion;
+    for (int64_t added = 1; added < blocks; ++added) {
+        stage->push_back(Block(inplanes, planes, 1, torch::nn::Sequential(), groups, base_width, is_basic));
+    }
+
+    return stage;
+}
+
+/// Rewrites the convolutions of the selected stages to use dilation instead of
+/// stride.
+///
+/// For every Conv2d found in a selected stage the stride is set to 1, the
+/// dilation to the paired rate, and the padding to (kernel_size / 2) * rate.
+///
+/// @param stage_list     stage ids; 2, 3, 4, 5 map to layer1..layer4
+/// @param dilation_list  dilation rate for the stage at the same index
+///
+/// A length mismatch prints a message and changes nothing. An unknown stage id
+/// prints a message and is skipped.
+void ResNetImpl::make_dilated(std::vector<int> stage_list, std::vector<int> dilation_list) {
+    if (stage_list.size() != dilation_list.size()) {
+        std::cout << "make sure stage list len equal to dilation list len";
+        return;
+    }
+
+    std::map<int, torch::nn::Sequential> stage_dict;
+    stage_dict.emplace(2, this->layer1);
+    stage_dict.emplace(3, this->layer2);
+    stage_dict.emplace(4, this->layer3);
+    stage_dict.emplace(5, this->layer4);
+
+    for (size_t i = 0; i < stage_list.size(); ++i) {
+        // find() instead of operator[]: an unknown id must not insert a
+        // default-constructed module into the map.
+        auto stage = stage_dict.find(stage_list[i]);
+        if (stage == stage_dict.end()) {
+            std::cout << "make_dilated: unknown stage " << stage_list[i] << ", skipped\n";
+            continue;
+        }
+
+        int dilation_rate = dilation_list[i];
+        for (const auto& m : stage->second->modules()) {
+            // as<>() yields nullptr for anything that is not a Conv2d, which
+            // avoids depending on the demangled type name string.
+            auto* conv = m->as<torch::nn::Conv2d>();
+            if (conv == nullptr) {
+                continue;
+            }
+            conv->options.stride(1);
+            conv->options.dilation(dilation_rate);
+            int kernel_size = conv->options.kernel_size()->at(0);
+            conv->options.padding((kernel_size / 2) * dilation_rate);
+        }
+    }
+}
+
+/// Creates a ResNet with block counts {2, 2, 2, 2} and model type "resnet18".
+ResNet resnet18(int64_t num_classes) {
+    const std::vector<int> blocks_per_stage{ 2, 2, 2, 2 };
+    return ResNet(blocks_per_stage, num_classes, "resnet18");
+}
+
+/// Creates a ResNet with block counts {3, 4, 6, 3} and model type "resnet34".
+ResNet resnet34(int64_t num_classes) {
+    const std::vector<int> blocks_per_stage{ 3, 4, 6, 3 };
+    return ResNet(blocks_per_stage, num_classes, "resnet34");
+}
+
+/// Creates a ResNet with block counts {3, 4, 6, 3} and model type "resnet50".
+ResNet resnet50(int64_t num_classes) {
+    const std::vector<int> blocks_per_stage{ 3, 4, 6, 3 };
+    return ResNet(blocks_per_stage, num_classes, "resnet50");
+}
+
+/// Creates a ResNet with block counts {3, 4, 23, 3} and model type "resnet101".
+ResNet resnet101(int64_t num_classes) {
+    const std::vector<int> blocks_per_stage{ 3, 4, 23, 3 };
+    return ResNet(blocks_per_stage, num_classes, "resnet101");
+}
+
+/// Loads pretrained weights and returns a network with `num_classes` outputs.
+///
+/// A 1000-class network of the requested architecture is built and populated
+/// from `weight_path`. If `num_classes` is 1000 that network is returned as
+/// is. Otherwise a second network of the same architecture is created and
+/// every parameter and buffer whose name does not start with "fc." is copied
+/// into it, leaving the new classifier at its fresh initialisation.
+///
+/// @param num_classes  output size of the returned network's classifier
+/// @param model_name   key of getParams(), e.g. "resnet50"
+/// @param weight_path  file handed to torch::load
+/// @throws c10::Error  if `model_name` is not a key of getParams()
+ResNet pretrained_resnet(int64_t num_classes, std::string model_name, std::string weight_path){
+    const std::map<std::string, std::vector<int>> name2layers = getParams();
+    const auto entry = name2layers.find(model_name);
+    // operator[] would hand back an empty vector for an unknown name, which
+    // the ResNet constructor then indexes.
+    TORCH_CHECK(entry != name2layers.end(),
+        "pretrained_resnet: unknown model name '", model_name, "'");
+    const std::vector<int>& layers = entry->second;
+
+    int groups = 1;
+    int width_per_group = 64;
+    if (model_name == "resnext50_32x4d") {
+        groups = 32;
+        width_per_group = 4;
+    }
+    else if (model_name == "resnext101_32x8d") {
+        groups = 32;
+        width_per_group = 8;
+    }
+
+    ResNet net_pretrained(layers, 1000, model_name, groups, width_per_group);
+    torch::load(net_pretrained, weight_path);
+    if (num_classes == 1000) return net_pretrained;
+
+    // The target must share groups/width with the source, otherwise the
+    // ResNeXt tensors differ in shape and cannot be copied.
+    ResNet module(layers, num_classes, model_name, groups, width_per_group);
+
+    using TensorDict = torch::OrderedDict<std::string, torch::Tensor>;
+    TensorDict target_params = module->named_parameters(true /*recurse*/);
+    TensorDict target_buffers = module->named_buffers(true /*recurse*/);
+
+    // In-place copies into parameters need autograd recording switched off;
+    // the guard restores the previous mode on every exit path.
+    torch::NoGradGuard no_grad;
+    const auto copy_backbone = [](const TensorDict& source, TensorDict& target) {
+        for (const auto& item : source) {
+            if (item.key().rfind("fc.", 0) == 0) {
+                continue;  // classifier keeps its new initialisation
+            }
+            torch::Tensor* slot = target.find(item.key());
+            if (slot != nullptr) {
+                slot->copy_(item.value());
+            }
+        }
+    };
+    copy_backbone(net_pretrained->named_parameters(true /*recurse*/), target_params);
+    // Buffers hold the batch-norm running statistics; without them the copied
+    // weights run against freshly initialised statistics.
+    copy_backbone(net_pretrained->named_buffers(true /*recurse*/), target_buffers);
+
+    return module;
+}
@@ -0,0 +1,65 @@
+#ifndef RESNET_H
+#define RESNET_H
+#include"util.h"
+
+// Residual block module. Depending on `is_basic` it uses either two
+// convolutions (conv1, conv2) or three (conv1, conv2, conv3), each followed by
+// its batch-norm member, plus an optional module on the shortcut branch.
+class BlockImpl : public torch::nn::Module {
+public:
+    // inplanes/planes: channel counts used to size the convolutions.
+    // stride_: stride of the block. downsample_: module applied to the
+    // shortcut branch. groups/base_width: used to derive the internal width.
+    // is_basic: true selects the two-convolution layout.
+    BlockImpl(int64_t inplanes, int64_t planes, int64_t stride_ = 1,
+        torch::nn::Sequential downsample_ = nullptr, int groups = 1, int base_width = 64, bool is_basic = true);
+    // Applies the block to x and returns the activated sum with the shortcut.
+    torch::Tensor forward(torch::Tensor x);
+    // Shortcut-branch module; public, so it is reachable from outside.
+    torch::nn::Sequential downsample{ nullptr };
+private:
+    bool is_basic = true;
+    int64_t stride = 1;
+    torch::nn::Conv2d conv1{ nullptr };
+    torch::nn::BatchNorm2d bn1{ nullptr };
+    torch::nn::Conv2d conv2{ nullptr };
+    torch::nn::BatchNorm2d bn2{ nullptr };
+    // conv3/bn3 are only created when is_basic is false.
+    torch::nn::Conv2d conv3{ nullptr };
+    torch::nn::BatchNorm2d bn3{ nullptr };
+
+};
+// Declares the `Block` holder type wrapping BlockImpl.
+TORCH_MODULE(Block);
+
+
+// ResNet-style backbone: stem convolution + batch norm, four residual stages
+// (layer1..layer4) and a linear classifier (fc).
+class ResNetImpl : public torch::nn::Module {
+public:
+    // layers: block count per stage. model_type: selects the block layout.
+    // groups / width_per_group: forwarded to every block.
+    ResNetImpl(std::vector<int> layers, int num_classes = 1000, std::string model_type = "resnet18",
+        int groups = 1, int width_per_group = 64);
+
+    // Full classification pass.
+    torch::Tensor forward(torch::Tensor x);
+
+    // Returns the input plus the intermediate activations of the backbone.
+    std::vector<torch::Tensor> features(torch::Tensor x);
+
+    // Builds one stage of `blocks` residual blocks.
+    torch::nn::Sequential _make_layer(int64_t planes, int64_t blocks, int64_t stride = 1);
+
+    // Replaces stride with dilation in the convolutions of the given stages.
+    void make_dilated(std::vector<int> stage_list, std::vector<int> dilation_list);
+
+private:
+    // Channel multiplier of a block's output relative to `planes`.
+    int expansion = 1;
+    bool is_basic = true;
+    // Channel count fed to the next block; updated by _make_layer.
+    int64_t inplanes = 64;
+    int groups = 1;
+    int base_width = 64;
+
+    torch::nn::Conv2d conv1{ nullptr };
+    torch::nn::BatchNorm2d bn1{ nullptr };
+    torch::nn::Sequential layer1{ nullptr };
+    torch::nn::Sequential layer2{ nullptr };
+    torch::nn::Sequential layer3{ nullptr };
+    torch::nn::Sequential layer4{ nullptr };
+    torch::nn::Linear fc{ nullptr };
+};
+// Declares the `ResNet` holder type wrapping ResNetImpl.
+TORCH_MODULE(ResNet);
+
+// Maps each supported model name to its per-stage block counts.
+inline std::map<std::string, std::vector<int>> getParams(){
+    return {
+        { "resnet18",         { 2, 2, 2, 2 } },
+        { "resnet34",         { 3, 4, 6, 3 } },
+        { "resnet50",         { 3, 4, 6, 3 } },
+        { "resnet101",        { 3, 4, 23, 3 } },
+        { "resnet152",        { 3, 8, 36, 3 } },
+        { "resnext50_32x4d",  { 3, 4, 6, 3 } },
+        { "resnext101_32x8d", { 3, 4, 23, 3 } },
+    };
+}
+
+// Factory functions: each returns a freshly constructed network of the named
+// variant with `num_classes` classifier outputs.
+ResNet resnet18(int64_t num_classes);
+ResNet resnet34(int64_t num_classes);
+ResNet resnet50(int64_t num_classes);
+ResNet resnet101(int64_t num_classes);
+
+// Builds the variant named `model_name`, loads weights from `weight_path`, and
+// returns a network whose classifier has `num_classes` outputs.
+ResNet pretrained_resnet(int64_t num_classes, std::string model_name, std::string weight_path);
+#endif // RESNET_H