[{"title":"(52个子文件232KB)Transformer_models-源码","children":[{"title":"transformer_models-master","children":[{"title":"docs","children":[{"title":"bert-intro.md <span style='color:#111;'>5.01KB</span>","children":null,"spread":false},{"title":"artifacts.md <span style='color:#111;'>2.63KB</span>","children":null,"spread":false},{"title":"dataprep.md <span style='color:#111;'>1.13KB</span>","children":null,"spread":false}],"spread":true},{"title":"huggingface_models","children":[{"title":"modeling_electra.py <span style='color:#111;'>21.83KB</span>","children":null,"spread":false}],"spread":true},{"title":"pretrain","children":[{"title":"PyTorch","children":[{"title":"models.py <span style='color:#111;'>10.96KB</span>","children":null,"spread":false},{"title":"text.py <span style='color:#111;'>107B</span>","children":null,"spread":false},{"title":"utils.py <span style='color:#111;'>356B</span>","children":null,"spread":false},{"title":"azureml_adapter.py <span style='color:#111;'>1.48KB</span>","children":null,"spread":false},{"title":"logger.py <span style='color:#111;'>697B</span>","children":null,"spread":false},{"title":"train.py <span style='color:#111;'>24.15KB</span>","children":null,"spread":false},{"title":"dataset.py <span style='color:#111;'>6.72KB</span>","children":null,"spread":false},{"title":"benchmark.py <span style='color:#111;'>1.24KB</span>","children":null,"spread":false},{"title":"configuration.py <span style='color:#111;'>1.71KB</span>","children":null,"spread":false},{"title":"dataprep","children":[{"title":"create_pretraining.py <span style='color:#111;'>4.01KB</span>","children":null,"spread":false},{"title":"single_line_doc_file_creation.py <span style='color:#111;'>905B</span>","children":null,"spread":false},{"title":"split_data_into_files.py <span style='color:#111;'>1.54KB</span>","children":null,"spread":false},{"title":"sentence_segmentation.py <span style='color:#111;'>612B</span>","children":null,"spread":false}],"spread":false},{"title":"distributed_apex.py <span style='color:#111;'>24.49KB</span>","children":null,"spread":false},{"title":"sources.py <span style='color:#111;'>9.34KB</span>","children":null,"spread":false},{"title":"checkpoint.py <span style='color:#111;'>2.45KB</span>","children":null,"spread":false},{"title":"optimization.py <span style='color:#111;'>1.17KB</span>","children":null,"spread":false},{"title":"README.md <span style='color:#111;'>341B</span>","children":null,"spread":false},{"title":"notebooks","children":[{"title":"BERT_Pretrain.ipynb <span style='color:#111;'>17.14KB</span>","children":null,"spread":false}],"spread":false}],"spread":false},{"title":"configs","children":[{"title":"bert-large-single-node.json <span style='color:#111;'>1019B</span>","children":null,"spread":false},{"title":"bert-base-single-node-rui.json <span style='color:#111;'>1.04KB</span>","children":null,"spread":false},{"title":"bert-base.json <span style='color:#111;'>987B</span>","children":null,"spread":false},{"title":"electra-small-single-node-rui.json <span style='color:#111;'>1.29KB</span>","children":null,"spread":false},{"title":"bert-base-single-node.json <span style='color:#111;'>1013B</span>","children":null,"spread":false},{"title":"bert-large.json <span style='color:#111;'>993B</span>","children":null,"spread":false}],"spread":true},{"title":"README.md <span style='color:#111;'>2.34KB</span>","children":null,"spread":false},{"title":"scripts","children":[{"title":"single_node_bert.lsf <span style='color:#111;'>1.46KB</span>","children":null,"spread":false},{"title":"single_node_electra.lsf <span style='color:#111;'>1.53KB</span>","children":null,"spread":false}],"spread":true}],"spread":true},{"title":"finetune","children":[{"title":"run_classifier_azureml.py <span style='color:#111;'>45.75KB</span>","children":null,"spread":false},{"title":"evaluate_squad.py <span style='color:#111;'>3.34KB</span>","children":null,"spread":false},{"title":"PyTorch","children":[{"title":"run_finetuning_glue.py <span style='color:#111;'>37.09KB</span>","children":null,"spread":false},{"title":"models.py <span style='color:#111;'>4.96KB</span>","children":null,"spread":false},{"title":"azureml_bert_util.py <span style='color:#111;'>4.65KB</span>","children":null,"spread":false},{"title":"notebooks","children":[{"title":"Pretrained-BERT-GLUE.ipynb <span style='color:#111;'>19.20KB</span>","children":null,"spread":false},{"title":"BERT_Eval_GLUE.ipynb <span style='color:#111;'>13.44KB</span>","children":null,"spread":false},{"title":"Pretrained-BERT-NER.ipynb <span style='color:#111;'>46.99KB</span>","children":null,"spread":false},{"title":"BERT_Eval_SQUAD.ipynb <span style='color:#111;'>12.66KB</span>","children":null,"spread":false}],"spread":true},{"title":"run_finetuning_glue_horovodrun.py <span style='color:#111;'>34.22KB</span>","children":null,"spread":false},{"title":"dockerfile <span style='color:#111;'>317B</span>","children":null,"spread":false}],"spread":true},{"title":"run_squad_azureml.py <span style='color:#111;'>45.84KB</span>","children":null,"spread":false},{"title":"README.md <span style='color:#111;'>9.75KB</span>","children":null,"spread":false},{"title":"scripts","children":[{"title":"single_node_bert_fine_tuning.lsf <span style='color:#111;'>2.51KB</span>","children":null,"spread":false},{"title":"single_node_electra_fine_tuning.lsf <span style='color:#111;'>2.55KB</span>","children":null,"spread":false}],"spread":true},{"title":"TensorFlow","children":[{"title":"run_classifier.py <span style='color:#111;'>32.15KB</span>","children":null,"spread":false},{"title":"download_model_and_dataset.py <span style='color:#111;'>3.04KB</span>","children":null,"spread":false},{"title":"notebooks","children":[{"title":"Tensorflow-BERT-AzureML.ipynb <span style='color:#111;'>139.93KB</span>","children":null,"spread":false}],"spread":false}],"spread":true}],"spread":true},{"title":"LICENSE <span style='color:#111;'>1.13KB</span>","children":null,"spread":false},{"title":"README.md <span style='color:#111;'>6.31KB</span>","children":null,"spread":false}],"spread":true}],"spread":true}]