[{"title":"( 92 个子文件 387KB ) SpanBERT:使用和评估SpanBERT的代码","children":[{"title":"SpanBERT-master","children":[{"title":"pretraining","children":[{"title":"fairseq","children":[{"title":"models","children":[{"title":"fairseq_model.py <span style='color:#111;'> 7.04KB </span>","children":null,"spread":false},{"title":"hf_bert.py <span style='color:#111;'> 38.71KB </span>","children":null,"spread":false},{"title":"fairseq_encoder.py <span style='color:#111;'> 1.45KB </span>","children":null,"spread":false},{"title":"fairseq_incremental_decoder.py <span style='color:#111;'> 3.18KB </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 4.20KB </span>","children":null,"spread":false},{"title":"distributed_fairseq_model.py <span style='color:#111;'> 2.91KB </span>","children":null,"spread":false},{"title":"fairseq_decoder.py <span style='color:#111;'> 2.01KB </span>","children":null,"spread":false},{"title":"pair_bert.py <span style='color:#111;'> 42.04KB </span>","children":null,"spread":false}],"spread":true},{"title":"options.py <span style='color:#111;'> 18.57KB </span>","children":null,"spread":false},{"title":"optim","children":[{"title":"nag.py <span style='color:#111;'> 2.52KB </span>","children":null,"spread":false},{"title":"fairseq_optimizer.py <span style='color:#111;'> 3.16KB </span>","children":null,"spread":false},{"title":"adam.py <span style='color:#111;'> 5.49KB </span>","children":null,"spread":false},{"title":"bert_adam.py <span style='color:#111;'> 7.94KB </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 1.70KB </span>","children":null,"spread":false},{"title":"sgd.py <span style='color:#111;'> 1.03KB </span>","children":null,"spread":false},{"title":"fp16_optimizer.py <span style='color:#111;'> 6.39KB </span>","children":null,"spread":false},{"title":"adagrad.py <span style='color:#111;'> 1.12KB </span>","children":null,"spread":false},{"title":"lr_scheduler","children":[{"title":"cosine_lr_scheduler.py <span style='color:#111;'> 4.37KB </span>","children":null,"spread":false},{"title":"polynomial_decay_schedule.py <span style='color:#111;'> 2.76KB </span>","children":null,"spread":false},{"title":"reduce_lr_on_plateau.py <span style='color:#111;'> 1.71KB </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 1.30KB </span>","children":null,"spread":false},{"title":"fairseq_lr_scheduler.py <span style='color:#111;'> 1.40KB </span>","children":null,"spread":false},{"title":"fixed_schedule.py <span style='color:#111;'> 2.35KB </span>","children":null,"spread":false},{"title":"inverse_square_root_schedule.py <span style='color:#111;'> 2.92KB </span>","children":null,"spread":false},{"title":"triangular_lr_scheduler.py <span style='color:#111;'> 2.57KB </span>","children":null,"spread":false}],"spread":false}],"spread":true},{"title":"meters.py <span style='color:#111;'> 3.73KB </span>","children":null,"spread":false},{"title":"tokenizer.py <span style='color:#111;'> 4.41KB </span>","children":null,"spread":false},{"title":"utils.py <span style='color:#111;'> 15.94KB </span>","children":null,"spread":false},{"title":"tasks","children":[{"title":"fairseq_task.py <span style='color:#111;'> 5.94KB </span>","children":null,"spread":false},{"title":"span_bert.py <span style='color:#111;'> 7.63KB </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 2.32KB </span>","children":null,"spread":false}],"spread":true},{"title":"data","children":[{"title":"dictionary.py <span style='color:#111;'> 7.28KB </span>","children":null,"spread":false},{"title":"iterators.py <span style='color:#111;'> 8.09KB </span>","children":null,"spread":false},{"title":"fairseq_dataset.py <span style='color:#111;'> 1.70KB </span>","children":null,"spread":false},{"title":"masking.py <span style='color:#111;'> 12.40KB </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 874B </span>","children":null,"spread":false},{"title":"span_bert_dataset.py <span style='color:#111;'> 19.21KB </span>","children":null,"spread":false},{"title":"indexed_dataset.py <span style='color:#111;'> 8.63KB </span>","children":null,"spread":false},{"title":"data_utils.py <span style='color:#111;'> 6.08KB </span>","children":null,"spread":false},{"title":"no_nsp_span_bert_dataset.py <span style='color:#111;'> 9.81KB </span>","children":null,"spread":false}],"spread":true},{"title":"multiprocessing_pdb.py <span style='color:#111;'> 1.01KB </span>","children":null,"spread":false},{"title":"distributed_utils.py <span style='color:#111;'> 4.57KB </span>","children":null,"spread":false},{"title":"criterions","children":[{"title":"fairseq_criterion.py <span style='color:#111;'> 1.68KB </span>","children":null,"spread":false},{"title":"cross_entropy.py <span style='color:#111;'> 2.43KB </span>","children":null,"spread":false},{"title":"label_smoothed_cross_entropy.py <span style='color:#111;'> 3.12KB </span>","children":null,"spread":false},{"title":"mlm_loss.py <span style='color:#111;'> 2.67KB </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 1.61KB </span>","children":null,"spread":false},{"title":"bert_loss.py <span style='color:#111;'> 3.39KB </span>","children":null,"spread":false},{"title":"spanbert_loss.py <span style='color:#111;'> 3.91KB </span>","children":null,"spread":false},{"title":"composite_loss.py <span style='color:#111;'> 2.89KB </span>","children":null,"spread":false},{"title":"mlm_nsp_sbo_loss.py <span style='color:#111;'> 4.57KB </span>","children":null,"spread":false}],"spread":true},{"title":"__init__.py <span style='color:#111;'> 512B </span>","children":null,"spread":false},{"title":"trainer.py <span style='color:#111;'> 14.85KB </span>","children":null,"spread":false},{"title":"legacy_distributed_data_parallel.py <span style='color:#111;'> 4.76KB </span>","children":null,"spread":false},{"title":"progress_bar.py <span style='color:#111;'> 6.91KB </span>","children":null,"spread":false},{"title":"modules","children":[{"title":"grad_multiply.py <span style='color:#111;'> 550B </span>","children":null,"spread":false},{"title":"bidirectional_multihead_attention.py <span style='color:#111;'> 5.97KB </span>","children":null,"spread":false},{"title":"learned_positional_embedding.py <span style='color:#111;'> 1.39KB </span>","children":null,"spread":false},{"title":"sinusoidal_positional_embedding.py <span style='color:#111;'> 3.71KB </span>","children":null,"spread":false},{"title":"downsampled_multihead_attention.py <span style='color:#111;'> 9.69KB </span>","children":null,"spread":false},{"title":"beamable_mm.py <span style='color:#111;'> 1.84KB </span>","children":null,"spread":false},{"title":"multihead_attention.py <span style='color:#111;'> 14.08KB </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 1.23KB </span>","children":null,"spread":false},{"title":"adaptive_softmax.py <span style='color:#111;'> 7.41KB </span>","children":null,"spread":false},{"title":"highway.py <span style='color:#111;'> 1.82KB </span>","children":null,"spread":false},{"title":"scalar_bias.py <span style='color:#111;'> 996B </span>","children":null,"spread":false},{"title":"adaptive_input.py <span style='color:#111;'> 2.39KB </span>","children":null,"spread":false},{"title":"adaptive_inputs.py <span style='color:#111;'> 2.39KB </span>","children":null,"spread":false}],"spread":false}],"spread":false},{"title":"train.py <span style='color:#111;'> 14.19KB </span>","children":null,"spread":false},{"title":"distributed_train.py <span style='color:#111;'> 1.85KB </span>","children":null,"spread":false},{"title":"multiprocessing_train.py <span style='color:#111;'> 2.93KB </span>","children":null,"spread":false},{"title":"dict.txt <span style='color:#111;'> 374.44KB </span>","children":null,"spread":false},{"title":"preprocess.py <span style='color:#111;'> 11.07KB </span>","children":null,"spread":false},{"title":".gitignore <span style='color:#111;'> 1.21KB </span>","children":null,"spread":false},{"title":"README.md <span style='color:#111;'> 2.12KB </span>","children":null,"spread":false},{"title":"bpe_tokenize.py <span style='color:#111;'> 2.08KB </span>","children":null,"spread":false}],"spread":true},{"title":"LICENSE <span style='color:#111;'> 18.88KB </span>","children":null,"spread":false},{"title":"CONTRIBUTING.md <span style='color:#111;'> 1.22KB </span>","children":null,"spread":false},{"title":"code","children":[{"title":"run_glue.py <span style='color:#111;'> 39.67KB </span>","children":null,"spread":false},{"title":"pytorch_pretrained_bert","children":[{"title":"tokenization.py <span style='color:#111;'> 16.60KB </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 646B </span>","children":null,"spread":false},{"title":"optimization.py <span style='color:#111;'> 7.84KB </span>","children":null,"spread":false},{"title":"file_utils.py <span style='color:#111;'> 8.98KB </span>","children":null,"spread":false},{"title":"modeling.py <span style='color:#111;'> 58.67KB </span>","children":null,"spread":false}],"spread":true},{"title":"run_tacred.py <span style='color:#111;'> 26.49KB </span>","children":null,"spread":false},{"title":"download_finetuned.sh <span style='color:#111;'> 264B </span>","children":null,"spread":false},{"title":"run_mrqa.py <span style='color:#111;'> 41.85KB </span>","children":null,"spread":false},{"title":"mrqa_official_eval.py <span style='color:#111;'> 4.87KB </span>","children":null,"spread":false},{"title":"run_squad.py <span style='color:#111;'> 49.73KB </span>","children":null,"spread":false}],"spread":true},{"title":"requirements.txt <span style='color:#111;'> 581B </span>","children":null,"spread":false},{"title":"CODE_OF_CONDUCT.md <span style='color:#111;'> 243B </span>","children":null,"spread":false},{"title":"README.md <span style='color:#111;'> 5.96KB </span>","children":null,"spread":false}],"spread":true}],"spread":true}]