Skip to content

Commit cfdbf4e

Browse files
Wong4j authored and nv-kkudrynski committed
[BERT/Paddle] BERT Paddle initial release
1 parent b1fc3c4 commit cfdbf4e

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

54 files changed

+126382
-0
lines changed
Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,15 @@
1+
# Base image for the build; override with --build-arg FROM_IMAGE_NAME=<image>.
ARG FROM_IMAGE_NAME=nvcr.io/nvidia/paddlepaddle:22.08-py3
2+
3+
FROM ${FROM_IMAGE_NAME}
4+
5+
# Install archive/stream utilities (presumably used by the data-preparation
# scripts; confirm). --no-install-recommends keeps optional packages out of the
# image, and the apt package lists are removed in the same layer so they do not
# persist in the final image.
RUN apt-get update && apt-get install -y --no-install-recommends \
        bzip2 \
        cabextract \
        pbzip2 \
        pv \
    && rm -rf /var/lib/apt/lists/*
6+
7+
# Exported into the container environment. Uses key=value form because the
# space-separated `ENV key value` syntax is a deprecated legacy format.
ENV BERT_PREP_WORKING_DIR=/workspace/bert/data
8+
# Copy only the dependency manifest so the later pip install layer stays cached
# until requirements.txt changes. COPY is used instead of ADD because this is a
# plain local file with no archive extraction or remote fetch involved.
COPY requirements.txt /workspace/
9+
# Relative paths in the following instructions (requirements.txt, git clones)
# resolve under /workspace/.
WORKDIR /workspace/
10+
# Install the Python dependencies listed in requirements.txt; --no-cache-dir
# keeps pip's download cache out of the image layer.
RUN pip install --no-cache-dir -r requirements.txt
11+
# Fetch wikiextractor and check out a fixed commit so rebuilds use the same
# sources. `git -C` runs the checkout inside the clone without `cd` in RUN
# (the original trailing `cd ..` had no effect beyond this RUN step).
RUN git clone https://github.com/attardi/wikiextractor.git \
    && git -C wikiextractor checkout 6408a430fc504a38b04d37ce5e7fc740191dee16
12+
# NOTE(review): this clone takes the default branch head and is not pinned to a
# commit, so rebuilding the image can pick up different bookcorpus sources.
# Consider checking out a fixed commit once the intended revision is confirmed.
RUN git clone https://github.com/soskek/bookcorpus.git
13+
14+
# Copy the build context into the image last, so source changes do not
# invalidate the dependency layers. COPY is used instead of ADD because this is
# a plain directory copy with no archive extraction or remote fetch involved.
COPY . /workspace/bert
15+
# Default working directory for containers started from this image.
WORKDIR /workspace/bert

PaddlePaddle/LanguageModeling/BERT/README.md

Lines changed: 928 additions & 0 deletions
Large diffs are not rendered by default.
Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
# Copyright (c) 2022 NVIDIA Corporation. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
{
2+
"attention_probs_dropout_prob": 0.1,
3+
"hidden_act": "gelu",
4+
"hidden_dropout_prob": 0.1,
5+
"hidden_size": 768,
6+
"initializer_range": 0.02,
7+
"intermediate_size": 3072,
8+
"max_position_embeddings": 512,
9+
"num_attention_heads": 12,
10+
"num_hidden_layers": 12,
11+
"type_vocab_size": 2,
12+
"vocab_size": 28996
13+
}
Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
{
2+
"attention_probs_dropout_prob": 0.1,
3+
"hidden_act": "gelu",
4+
"hidden_dropout_prob": 0.1,
5+
"hidden_size": 768,
6+
"initializer_range": 0.02,
7+
"intermediate_size": 3072,
8+
"max_position_embeddings": 512,
9+
"num_attention_heads": 12,
10+
"num_hidden_layers": 12,
11+
"type_vocab_size": 2,
12+
"vocab_size": 30522
13+
}
Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
{
2+
"attention_probs_dropout_prob": 0.1,
3+
"hidden_act": "gelu",
4+
"hidden_dropout_prob": 0.1,
5+
"hidden_size": 1024,
6+
"initializer_range": 0.02,
7+
"intermediate_size": 4096,
8+
"max_position_embeddings": 512,
9+
"num_attention_heads": 16,
10+
"num_hidden_layers": 24,
11+
"type_vocab_size": 2,
12+
"vocab_size": 28996
13+
}
Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
{
2+
"attention_probs_dropout_prob": 0.1,
3+
"hidden_act": "gelu",
4+
"hidden_dropout_prob": 0.1,
5+
"hidden_size": 1024,
6+
"initializer_range": 0.02,
7+
"intermediate_size": 4096,
8+
"max_position_embeddings": 512,
9+
"num_attention_heads": 16,
10+
"num_hidden_layers": 24,
11+
"type_vocab_size": 2,
12+
"vocab_size": 30522
13+
}

0 commit comments

Comments
 (0)