[{"title":"( 31 个子文件 85KB ) Python-大规模transformer语言模型包括BERT","children":[{"title":"NVIDIA-Megatron-LM-fb4cbdc","children":[{"title":"optim","children":[{"title":"__init__.py <span style='color:#111;'> 962B </span>","children":null,"spread":false},{"title":"adam.py <span style='color:#111;'> 5.26KB </span>","children":null,"spread":false}],"spread":true},{"title":"pretrain_bert.py <span style='color:#111;'> 17.25KB </span>","children":null,"spread":false},{"title":"arguments.py <span style='color:#111;'> 13.41KB </span>","children":null,"spread":false},{"title":"fp16","children":[{"title":"loss_scaler.py <span style='color:#111;'> 9.19KB </span>","children":null,"spread":false},{"title":"fp16util.py <span style='color:#111;'> 7.45KB </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 941B </span>","children":null,"spread":false},{"title":"fp16.py <span style='color:#111;'> 30.85KB </span>","children":null,"spread":false}],"spread":true},{"title":"model","children":[{"title":"distributed.py <span style='color:#111;'> 4.53KB </span>","children":null,"spread":false},{"title":"modeling.py <span style='color:#111;'> 62.49KB </span>","children":null,"spread":false},{"title":"model.py <span style='color:#111;'> 3.61KB </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 674B </span>","children":null,"spread":false}],"spread":true},{"title":"scripts","children":[{"title":"pretrain_bert_tfrecords_distributed.sh <span style='color:#111;'> 1.14KB </span>","children":null,"spread":false},{"title":"pretrain_bert_sentencepiece.sh <span style='color:#111;'> 864B </span>","children":null,"spread":false},{"title":"pretrain_bert_distributed.sh <span style='color:#111;'> 1.12KB </span>","children":null,"spread":false},{"title":"pretrain_bert.sh <span style='color:#111;'> 868B </span>","children":null,"spread":false}],"spread":true},{"title":"utils.py <span style='color:#111;'> 5.94KB </span>","children":null,"spread":false},{"title":"configure_data.py <span style='color:#111;'> 8.12KB </span>","children":null,"spread":false},{"title":"requirements.txt <span style='color:#111;'> 79B </span>","children":null,"spread":false},{"title":"learning_rates.py <span style='color:#111;'> 2.92KB </span>","children":null,"spread":false},{"title":"LICENSE <span style='color:#111;'> 11.17KB </span>","children":null,"spread":false},{"title":"README.md <span style='color:#111;'> 5.32KB </span>","children":null,"spread":false},{"title":"data_utils","children":[{"title":"file_utils.py <span style='color:#111;'> 8.24KB </span>","children":null,"spread":false},{"title":"samplers.py <span style='color:#111;'> 3.44KB </span>","children":null,"spread":false},{"title":"tokenization.py <span style='color:#111;'> 31.55KB </span>","children":null,"spread":false},{"title":"datasets.py <span style='color:#111;'> 24.96KB </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 4.66KB </span>","children":null,"spread":false},{"title":"lazy_loader.py <span style='color:#111;'> 6.71KB </span>","children":null,"spread":false},{"title":"tf_dl.py <span style='color:#111;'> 4.13KB </span>","children":null,"spread":false},{"title":"wordpiece.py <span style='color:#111;'> 15.23KB </span>","children":null,"spread":false},{"title":"corpora.py <span style='color:#111;'> 1.32KB </span>","children":null,"spread":false}],"spread":true}],"spread":false}],"spread":true}]