-
Notifications
You must be signed in to change notification settings - Fork 687
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Implement oneflow.embedding op (#8110)
* impl embedding op * refine * fix the norm logic * rename kernel * refine * impl in python * refine * add unit tests and fix bug * refine * refine kernel * fix typo * fix * move functor * use primitive memset * fix int64 * refine renorm kernel and unit test * fix typo * add op dev states * use check_graph * fix graph backward * refine unit test * refine unit test * add global test * debug * fix sparse unit test * fix * fix * auto format by CI * fix clang error * fix unit test * auto format by CI * fix * refine unit test * refine kernel * refine * fix * refine renorm kernel * add sync * refine * rm test case(tmp) * add unit test * fix * add sync * try another test case * auto format by CI * fix * auto format by CI * remove autotest case for scale_by_grad Co-authored-by: oneflow-ci-bot <ci-bot@oneflow.org> Co-authored-by: mergify[bot] <37929162+mergify[bot]@users.noreply.github.com>
- Loading branch information
1 parent
445e236
commit 45cfcb5
Showing
15 changed files
with
1,286 additions
and
87 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,84 @@ | ||
/* | ||
Copyright 2020 The OneFlow Authors. All rights reserved. | ||
Licensed under the Apache License, Version 2.0 (the "License"); | ||
you may not use this file except in compliance with the License. | ||
You may obtain a copy of the License at | ||
http://www.apache.org/licenses/LICENSE-2.0 | ||
Unless required by applicable law or agreed to in writing, software | ||
distributed under the License is distributed on an "AS IS" BASIS, | ||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
See the License for the specific language governing permissions and | ||
limitations under the License. | ||
*/ | ||
|
||
#include "oneflow/core/common/container_util.h" | ||
#include "oneflow/core/framework/op_expr_grad_function.h" | ||
#include "oneflow/core/framework/op_expr.h" | ||
#include "oneflow/core/framework/op_interpreter/op_interpreter_util.h" | ||
#include "oneflow/core/functional/functional.h" | ||
|
||
namespace oneflow { | ||
namespace one { | ||
|
||
struct EmbeddingCaptureState : public AutoGradCaptureState { | ||
int64_t padding_idx = -1; | ||
bool scale_grad_by_freq = false; | ||
bool requires_grad = false; | ||
}; | ||
|
||
class Embedding : public OpExprGradFunction<EmbeddingCaptureState> { | ||
public: | ||
Maybe<void> Init(const OpExpr& op) override; | ||
Maybe<void> Capture(EmbeddingCaptureState* ctx, const TensorTuple& inputs, | ||
const TensorTuple& outputs, const AttrMap& attrs) const override; | ||
Maybe<void> Apply(const EmbeddingCaptureState* ctx, const TensorTuple& out_grads, | ||
TensorTuple* in_grads) const override; | ||
|
||
private: | ||
AttrMap base_attrs_; | ||
}; | ||
|
||
Maybe<void> Embedding::Init(const OpExpr& op) { | ||
const UserOpExpr* fw_op_expr = dynamic_cast<const UserOpExpr*>(&op); | ||
CHECK_NOTNULL_OR_RETURN(fw_op_expr) << "Forward op must be not null"; | ||
base_attrs_ = MakeAttrMapFromUserOpConf(fw_op_expr->proto()); | ||
return Maybe<void>::Ok(); | ||
} | ||
|
||
Maybe<void> Embedding::Capture(EmbeddingCaptureState* ctx, const TensorTuple& inputs, | ||
const TensorTuple& outputs, const AttrMap& attrs) const { | ||
ctx->requires_grad = JUST(oneflow::VectorAt(inputs, 0))->requires_grad(); | ||
if (!ctx->requires_grad) { return Maybe<void>::Ok(); } | ||
|
||
ctx->SaveTensorForBackward(JUST(oneflow::VectorAt(inputs, 0))); | ||
ctx->SaveTensorForBackward(JUST(oneflow::VectorAt(inputs, 1))); | ||
|
||
ComposedAttrMap composed_attrs(attrs, base_attrs_); | ||
ctx->padding_idx = JUST(composed_attrs.GetAttr<int64_t>("padding_idx")); | ||
ctx->scale_grad_by_freq = JUST(composed_attrs.GetAttr<bool>("scale_grad_by_freq")); | ||
return Maybe<void>::Ok(); | ||
} | ||
|
||
Maybe<void> Embedding::Apply(const EmbeddingCaptureState* ctx, const TensorTuple& out_grads, | ||
TensorTuple* in_grads) const { | ||
CHECK_EQ_OR_RETURN(out_grads.size(), 1); // NOLINT(maybe-need-error-msg) | ||
if (!ctx->requires_grad) { return Maybe<void>::Ok(); } | ||
|
||
in_grads->resize(ctx->SavedTensors().size()); | ||
const auto& weight = JUST(oneflow::VectorAt(ctx->SavedTensors(), 0)); | ||
const auto& indices = JUST(oneflow::VectorAt(ctx->SavedTensors(), 1)); | ||
int64_t padding_idx = ctx->padding_idx; | ||
bool scale_grad_by_freq = ctx->scale_grad_by_freq; | ||
|
||
JUST(oneflow::VectorAt(*in_grads, 0)) = JUST(functional::EmbeddingGrad( | ||
JUST(oneflow::VectorAt(out_grads, 0)), weight, indices, padding_idx, scale_grad_by_freq)); | ||
return Maybe<void>::Ok(); | ||
} | ||
|
||
REGISTER_OP_EXPR_GRAD_FUNCTION("embedding", Embedding); | ||
|
||
} // namespace one | ||
} // namespace oneflow |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.