How to make a region of interest proposal from convolutional feature maps?

Problem

Keras does not have a direct implementation of region of interest (ROI) pooling. I know how to perform max pooling, but I don't know how to get bounding boxes from the feature maps produced by the convolutional layers.

Is there any way to directly implement a region proposal algorithm?

Example

Let's say there is an architecture like this:

enter image description here

So we have a multi-input neural network architecture that eventually leads to the ROI MaxPool layer. It has three inputs: screenshot, textmaps and candidates. Leaving candidates aside, the Keras code would look like this:

from keras.models import Model

from keras.layers import Input, Dense, Conv2D, ZeroPadding2D, MaxPooling2D, BatchNormalization, concatenate

from keras.activations import relu

from keras.initializers import RandomUniform, Constant, TruncatedNormal



# Two-branch convolutional feature extractor (screenshot branch + text-map
# branch) whose concatenated activations feed one final Conv+ReLU layer.

# Network 1, Layer 1
# The channel axis must be non-zero, otherwise conv1 has no input features to
# convolve over. 3 assumes an RGB screenshot -- TODO confirm (1 for grayscale).
screenshot = Input(shape=(1280, 1280, 3),
                   dtype='float32',
                   name='screenshot')
# padding='same' is used instead of an explicit ZeroPadding2D layer.
# With stride 4 the spatial size becomes 1280 / 4 = 320.
conv1 = Conv2D(filters=96,
               kernel_size=11,
               strides=(4, 4),
               activation=relu,
               padding='same')(screenshot)
# Stride-2 pooling with 'same' padding halves the spatial size: 320 -> 160.
pooling1 = MaxPooling2D(pool_size=(3, 3),
                        strides=(2, 2),
                        padding='same')(conv1)
# BatchNormalization presumably stands in for local response normalization:
# https://stats.stackexchange.com/questions/145768/importance-of-local-response-normalization-in-cnn
normalized1 = BatchNormalization()(pooling1)

# Network 1, Layer 2
conv2 = Conv2D(filters=256,
               kernel_size=5,
               activation=relu,
               padding='same')(normalized1)
normalized2 = BatchNormalization()(conv2)
conv3 = Conv2D(filters=384,
               kernel_size=3,
               activation=relu,
               padding='same',
               kernel_initializer=TruncatedNormal(stddev=0.01),
               bias_initializer=Constant(value=0.1))(normalized2)

# Network 2, Layer 1
# The text maps are 160x160, the same spatial size conv3 produces, which is
# what allows the channel-wise concatenation below.
textmaps = Input(shape=(160, 160, 128),
                 dtype='float32',
                 name='textmaps')
txt_conv1 = Conv2D(filters=48,
                   kernel_size=1,
                   activation=relu,
                   padding='same',
                   kernel_initializer=TruncatedNormal(stddev=0.01),
                   bias_initializer=Constant(value=0.1))(textmaps)

# (Network 1 + Network 2), Layer 1
# Stack both branches along the channel axis: 384 + 48 = 432 channels.
merged = concatenate([conv3, txt_conv1], axis=-1)
# NOTE(review): this explicit 2-pixel zero padding is followed by a
# padding='same' convolution, so the output is 164x164 rather than 160x160.
# Confirm this is intended; otherwise drop this layer or use padding='valid'.
merged_padding = ZeroPadding2D(padding=2, data_format=None)(merged)
merged_conv = Conv2D(filters=96,
                     kernel_size=5,
                     activation=relu,
                     padding='same',
                     kernel_initializer=TruncatedNormal(stddev=0.01),
                     bias_initializer=Constant(value=0.1))(merged_padding)

If you look at the end of the code (and at the architecture itself), we concatenate the activations from two different Conv+ReLU layers and then pass the result to the ROI MaxPool layer.

Thank you!

edited 27 mins ago

asked 37 mins ago

ShellRox

1978

add a comment |

Problem

Is there any way to directly implement a region proposal algorithm?

Example

Let's say there is an architecture like this:

enter image description here

from keras.models import Model

from keras.layers import Input, Dense, Conv2D, ZeroPadding2D, MaxPooling2D, BatchNormalization, concatenate

from keras.activations import relu

from keras.initializers import RandomUniform, Constant, TruncatedNormal



# Two-branch convolutional feature extractor (screenshot branch + text-map
# branch) whose concatenated activations feed one final Conv+ReLU layer.

# Network 1, Layer 1
# The channel axis must be non-zero, otherwise conv1 has no input features to
# convolve over. 3 assumes an RGB screenshot -- TODO confirm (1 for grayscale).
screenshot = Input(shape=(1280, 1280, 3),
                   dtype='float32',
                   name='screenshot')
# padding='same' is used instead of an explicit ZeroPadding2D layer.
# With stride 4 the spatial size becomes 1280 / 4 = 320.
conv1 = Conv2D(filters=96,
               kernel_size=11,
               strides=(4, 4),
               activation=relu,
               padding='same')(screenshot)
# Stride-2 pooling with 'same' padding halves the spatial size: 320 -> 160.
pooling1 = MaxPooling2D(pool_size=(3, 3),
                        strides=(2, 2),
                        padding='same')(conv1)
# BatchNormalization presumably stands in for local response normalization:
# https://stats.stackexchange.com/questions/145768/importance-of-local-response-normalization-in-cnn
normalized1 = BatchNormalization()(pooling1)

# Network 1, Layer 2
conv2 = Conv2D(filters=256,
               kernel_size=5,
               activation=relu,
               padding='same')(normalized1)
normalized2 = BatchNormalization()(conv2)
conv3 = Conv2D(filters=384,
               kernel_size=3,
               activation=relu,
               padding='same',
               kernel_initializer=TruncatedNormal(stddev=0.01),
               bias_initializer=Constant(value=0.1))(normalized2)

# Network 2, Layer 1
# The text maps are 160x160, the same spatial size conv3 produces, which is
# what allows the channel-wise concatenation below.
textmaps = Input(shape=(160, 160, 128),
                 dtype='float32',
                 name='textmaps')
txt_conv1 = Conv2D(filters=48,
                   kernel_size=1,
                   activation=relu,
                   padding='same',
                   kernel_initializer=TruncatedNormal(stddev=0.01),
                   bias_initializer=Constant(value=0.1))(textmaps)

# (Network 1 + Network 2), Layer 1
# Stack both branches along the channel axis: 384 + 48 = 432 channels.
merged = concatenate([conv3, txt_conv1], axis=-1)
# NOTE(review): this explicit 2-pixel zero padding is followed by a
# padding='same' convolution, so the output is 164x164 rather than 160x160.
# Confirm this is intended; otherwise drop this layer or use padding='valid'.
merged_padding = ZeroPadding2D(padding=2, data_format=None)(merged)
merged_conv = Conv2D(filters=96,
                     kernel_size=5,
                     activation=relu,
                     padding='same',
                     kernel_initializer=TruncatedNormal(stddev=0.01),
                     bias_initializer=Constant(value=0.1))(merged_padding)

If you look at the end of the code (and at the architecture itself), we concatenate the activations from two different Conv+ReLU layers and then pass the result to the ROI MaxPool layer.

Thank you!

edited 27 mins ago

asked 37 mins ago

ShellRox

1978

add a comment |

Problem

Is there any way to directly implement a region proposal algorithm?

Example

Let's say there is an architecture like this:

enter image description here

from keras.models import Model

from keras.layers import Input, Dense, Conv2D, ZeroPadding2D, MaxPooling2D, BatchNormalization, concatenate

from keras.activations import relu

from keras.initializers import RandomUniform, Constant, TruncatedNormal



# Two-branch convolutional feature extractor (screenshot branch + text-map
# branch) whose concatenated activations feed one final Conv+ReLU layer.

# Network 1, Layer 1
# The channel axis must be non-zero, otherwise conv1 has no input features to
# convolve over. 3 assumes an RGB screenshot -- TODO confirm (1 for grayscale).
screenshot = Input(shape=(1280, 1280, 3),
                   dtype='float32',
                   name='screenshot')
# padding='same' is used instead of an explicit ZeroPadding2D layer.
# With stride 4 the spatial size becomes 1280 / 4 = 320.
conv1 = Conv2D(filters=96,
               kernel_size=11,
               strides=(4, 4),
               activation=relu,
               padding='same')(screenshot)
# Stride-2 pooling with 'same' padding halves the spatial size: 320 -> 160.
pooling1 = MaxPooling2D(pool_size=(3, 3),
                        strides=(2, 2),
                        padding='same')(conv1)
# BatchNormalization presumably stands in for local response normalization:
# https://stats.stackexchange.com/questions/145768/importance-of-local-response-normalization-in-cnn
normalized1 = BatchNormalization()(pooling1)

# Network 1, Layer 2
conv2 = Conv2D(filters=256,
               kernel_size=5,
               activation=relu,
               padding='same')(normalized1)
normalized2 = BatchNormalization()(conv2)
conv3 = Conv2D(filters=384,
               kernel_size=3,
               activation=relu,
               padding='same',
               kernel_initializer=TruncatedNormal(stddev=0.01),
               bias_initializer=Constant(value=0.1))(normalized2)

# Network 2, Layer 1
# The text maps are 160x160, the same spatial size conv3 produces, which is
# what allows the channel-wise concatenation below.
textmaps = Input(shape=(160, 160, 128),
                 dtype='float32',
                 name='textmaps')
txt_conv1 = Conv2D(filters=48,
                   kernel_size=1,
                   activation=relu,
                   padding='same',
                   kernel_initializer=TruncatedNormal(stddev=0.01),
                   bias_initializer=Constant(value=0.1))(textmaps)

# (Network 1 + Network 2), Layer 1
# Stack both branches along the channel axis: 384 + 48 = 432 channels.
merged = concatenate([conv3, txt_conv1], axis=-1)
# NOTE(review): this explicit 2-pixel zero padding is followed by a
# padding='same' convolution, so the output is 164x164 rather than 160x160.
# Confirm this is intended; otherwise drop this layer or use padding='valid'.
merged_padding = ZeroPadding2D(padding=2, data_format=None)(merged)
merged_conv = Conv2D(filters=96,
                     kernel_size=5,
                     activation=relu,
                     padding='same',
                     kernel_initializer=TruncatedNormal(stddev=0.01),
                     bias_initializer=Constant(value=0.1))(merged_padding)

If you look at the end of the code (and at the architecture itself), we concatenate the activations from two different Conv+ReLU layers and then pass the result to the ROI MaxPool layer.

Thank you!

edited 27 mins ago

asked 37 mins ago

ShellRox

1978

Problem

Is there any way to directly implement a region proposal algorithm?

Example

Let's say there is an architecture like this:

enter image description here

from keras.models import Model

from keras.layers import Input, Dense, Conv2D, ZeroPadding2D, MaxPooling2D, BatchNormalization, concatenate

from keras.activations import relu

from keras.initializers import RandomUniform, Constant, TruncatedNormal



# Two-branch convolutional feature extractor (screenshot branch + text-map
# branch) whose concatenated activations feed one final Conv+ReLU layer.

# Network 1, Layer 1
# The channel axis must be non-zero, otherwise conv1 has no input features to
# convolve over. 3 assumes an RGB screenshot -- TODO confirm (1 for grayscale).
screenshot = Input(shape=(1280, 1280, 3),
                   dtype='float32',
                   name='screenshot')
# padding='same' is used instead of an explicit ZeroPadding2D layer.
# With stride 4 the spatial size becomes 1280 / 4 = 320.
conv1 = Conv2D(filters=96,
               kernel_size=11,
               strides=(4, 4),
               activation=relu,
               padding='same')(screenshot)
# Stride-2 pooling with 'same' padding halves the spatial size: 320 -> 160.
pooling1 = MaxPooling2D(pool_size=(3, 3),
                        strides=(2, 2),
                        padding='same')(conv1)
# BatchNormalization presumably stands in for local response normalization:
# https://stats.stackexchange.com/questions/145768/importance-of-local-response-normalization-in-cnn
normalized1 = BatchNormalization()(pooling1)

# Network 1, Layer 2
conv2 = Conv2D(filters=256,
               kernel_size=5,
               activation=relu,
               padding='same')(normalized1)
normalized2 = BatchNormalization()(conv2)
conv3 = Conv2D(filters=384,
               kernel_size=3,
               activation=relu,
               padding='same',
               kernel_initializer=TruncatedNormal(stddev=0.01),
               bias_initializer=Constant(value=0.1))(normalized2)

# Network 2, Layer 1
# The text maps are 160x160, the same spatial size conv3 produces, which is
# what allows the channel-wise concatenation below.
textmaps = Input(shape=(160, 160, 128),
                 dtype='float32',
                 name='textmaps')
txt_conv1 = Conv2D(filters=48,
                   kernel_size=1,
                   activation=relu,
                   padding='same',
                   kernel_initializer=TruncatedNormal(stddev=0.01),
                   bias_initializer=Constant(value=0.1))(textmaps)

# (Network 1 + Network 2), Layer 1
# Stack both branches along the channel axis: 384 + 48 = 432 channels.
merged = concatenate([conv3, txt_conv1], axis=-1)
# NOTE(review): this explicit 2-pixel zero padding is followed by a
# padding='same' convolution, so the output is 164x164 rather than 160x160.
# Confirm this is intended; otherwise drop this layer or use padding='valid'.
merged_padding = ZeroPadding2D(padding=2, data_format=None)(merged)
merged_conv = Conv2D(filters=96,
                     kernel_size=5,
                     activation=relu,
                     padding='same',
                     kernel_initializer=TruncatedNormal(stddev=0.01),
                     bias_initializer=Constant(value=0.1))(merged_padding)

If you look at the end of the code (and at the architecture itself), we concatenate the activations from two different Conv+ReLU layers and then pass the result to the ROI MaxPool layer.

Thank you!

python keras convnet

edited 27 mins ago

asked 37 mins ago

ShellRox

1978

edited 27 mins ago

asked 37 mins ago

ShellRox

1978

edited 27 mins ago

asked 37 mins ago

ShellRox

1978

asked 37 mins ago

ShellRox

1978

asked 37 mins ago

ShellRox

1978

add a comment |

0

active

oldest

votes

Your Answer

// When the "editor" feature is in use, load "mathjaxEditing" and add a
// creation callback that calls prepareWmdForMathJax on each new Markdown editor.
StackExchange.ifUsing("editor", function () {
return StackExchange.using("mathjaxEditing", function () {
StackExchange.MarkdownEditor.creationCallbacks.add(function (editor, postfix) {
// NOTE(review): "\$" evaluates to "$", so the second delimiter pair duplicates
// the first; possibly a garbled "\\(" / "\\)" pair -- confirm against the site source.
StackExchange.mathjaxEditing.prepareWmdForMathJax(editor, postfix, [["$", "$"], ["\$","\$"]]);
});
});
}, "mathjax-editing");

// Page-ready setup for the answer editor: renders the (empty) tag lists and
// then creates the editor, after the "snippets" module when snippets are enabled.
StackExchange.ready(function() {
    var channelOptions = {
        tags: "".split(" "),
        id: "557"
    };
    initTagRenderer("".split(" "), "".split(" "), channelOptions);

    StackExchange.using("externalEditor", function() {
        // Have to fire editor after snippets, if snippets enabled
        if (StackExchange.settings.snippets.snippetsEnabled) {
            StackExchange.using("snippets", function() {
                createEditor();
            });
        }
        else {
            createEditor();
        }
    });

    // Configures the answer editor. The two HTML strings keep their markup
    // as \u003c / \u003e escapes with backslash-escaped inner quotes, so each
    // one is a single valid string literal.
    function createEditor() {
        StackExchange.prepareEditor({
            heartbeatType: 'answer',
            autoActivateHeartbeat: false,
            convertImagesToLinks: false,
            noModals: true,
            showLowRepImageUploadWarning: true,
            reputationToPostImages: null,
            bindNavPrevention: true,
            postfix: "",
            imageUploader: {
                brandingHtml: "Powered by \u003ca class=\"icon-imgur-white\" href=\"https://imgur.com/\"\u003e\u003c/a\u003e",
                contentPolicyHtml: "User contributions licensed under \u003ca href=\"https://creativecommons.org/licenses/by-sa/3.0/\"\u003ecc by-sa 3.0 with attribution required\u003c/a\u003e \u003ca href=\"https://stackoverflow.com/legal/content-policy\"\u003e(content policy)\u003c/a\u003e",
                allowUrls: true
            },
            onDemand: true,
            discardSelector: ".discard-answer",
            immediatelyShowMarkdownHelp: true
        });
    }
});

draft saved

draft discarded

Sign up or log in

// On page ready, hook draft saving to the '#login-link' element
// (presumably so a draft is kept when the user goes to log in -- confirm).
StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

// On page ready, initialise the post-login flow for '.new-post-login' elements.
// The second argument is the URL-encoded address of this question's
// "#new-answer" anchor (presumably the return URL after login -- confirm).
StackExchange.ready(
function () {
StackExchange.openid.initPostLogin('.new-post-login', 'https%3a%2f%2fdatascience.stackexchange.com%2fquestions%2f44391%2fhow-to-make-a-region-of-interest-proposal-from-convolutional-feature-maps%23new-answer', 'question_page');
}
);

Post as a guest

Name

Required, but never shown

0

active

oldest

votes

0

active

oldest

votes

draft saved

draft discarded

Thanks for contributing an answer to Data Science Stack Exchange!

Please be sure to answer the question. Provide details and share your research!

But avoid …

Asking for help, clarification, or responding to other answers.

Making statements based on opinion; back them up with references or personal experience.

Use MathJax to format equations. MathJax reference.

To learn more, see our tips on writing great answers.

draft saved

draft discarded

Sign up or log in

// On page ready, hook draft saving to the '#login-link' element
// (presumably so a draft is kept when the user goes to log in -- confirm).
StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Post as a guest

Name

Required, but never shown

Sign up or log in

// On page ready, hook draft saving to the '#login-link' element
// (presumably so a draft is kept when the user goes to log in -- confirm).
StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Sign up or log in

// On page ready, hook draft saving to the '#login-link' element
// (presumably so a draft is kept when the user goes to log in -- confirm).
StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Sign up or log in

// On page ready, hook draft saving to the '#login-link' element
// (presumably so a draft is kept when the user goes to log in -- confirm).
StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Name

Required, but never shown

Name

Required, but never shown

This page is only for reference. If you need detailed information, please check here

搜尋此網誌

Htydjtk

How to make a region of interest proposal from convolutional feature maps?

Problem

Example

Problem

Example

Problem

Example

Problem

Example

0

Your Answer

Post as a guest

0

0

Post as a guest