Coverage report: 74%

Files Functions Classes

coverage.py v7.13.5, created at 2026-04-21 23:06 +0000

      Statements   Branches   Total
File function   coverage statements missing excluded   coverage branches partial   coverage
background_sync.py _log   100% 2 0 0   100% 0 0   100%
background_sync.py iter_new_checkpoint_files   89% 9 1 0   90% 10 1   89%
background_sync.py _is_old_enough   0% 3 3 0   0% 2 0   0%
background_sync.py _is_stable   0% 7 7 0   0% 2 0   0%
background_sync.py _looks_like_valid_torch_zip   0% 5 5 0   100% 0 0   0%
background_sync.py upload_checkpoint   92% 26 2 0   88% 8 1   91%
background_sync.py sync_once   100% 5 0 0   100% 4 0   100%
background_sync.py run_sync_loop   0% 9 9 0   100% 0 0   0%
background_sync.py _read_int_env   64% 11 4 0   75% 4 1   67%
background_sync.py _read_bool_env   80% 10 2 0   83% 6 1   81%
background_sync.py run_self_check   58% 31 13 0   10% 10 1   46%
background_sync.py main   93% 27 2 0   100% 4 0   94%
background_sync.py (no function)   100% 23 0 3   100% 0 0   100%
build_validation_dataset.py _build_default_specs   100% 1 0 0   100% 0 0   100%
build_validation_dataset.py _resolve_selection_indices   73% 11 3 0   70% 10 3   71%
build_validation_dataset.py _load_specs_from_config   83% 18 3 0   70% 10 3   79%
build_validation_dataset.py _validate_specs   60% 20 8 0   50% 12 4   56%
build_validation_dataset.py _rebalance_rows_to_min_capacity   100% 0 0 1   100% 0 0   100%
build_validation_dataset.py _probe_hf_dataset_capacity   0% 19 19 0   0% 6 0   0%
build_validation_dataset.py _rebalance_rows_to_min_capacity_with_probe   100% 23 0 0   79% 14 3   92%
build_validation_dataset.py _maybe_load_kaggle_secrets   76% 17 4 0   83% 6 1   78%
build_validation_dataset.py _resolve_hf_token   0% 1 1 0   100% 0 0   0%
build_validation_dataset.py _streaming_select_rows   91% 11 1 0   83% 6 1   88%
build_validation_dataset.py _load_remote_dataset   88% 16 2 0   67% 6 2   82%
build_validation_dataset.py _load_fineweb_shard   87% 30 4 0   78% 18 4   83%
build_validation_dataset.py _materialize_pillar   0% 11 11 0   0% 4 0   0%
build_validation_dataset.py _write_manifest   0% 4 4 0   100% 0 0   0%
build_validation_dataset.py _write_kaggle_metadata   100% 5 0 0   100% 0 0   100%
build_validation_dataset.py _run_kaggle_cli   0% 9 9 0   0% 6 0   0%
build_validation_dataset.py parse_args   0% 19 19 0   100% 0 0   0%
build_validation_dataset.py main   0% 38 38 0   0% 16 0   0%
build_validation_dataset.py (no function)   100% 35 0 2   100% 0 0   100%
compare_tokenizers.py parse_args   100% 14 0 0   100% 0 0   100%
compare_tokenizers.py load_samples   100% 16 0 0   100% 10 0   100%
compare_tokenizers.py filter_samples   100% 4 0 0   100% 2 0   100%
compare_tokenizers.py format_ratio   100% 6 0 0   100% 4 0   100%
compare_tokenizers.py normalize_whitespace   100% 1 0 0   100% 0 0   100%
compare_tokenizers.py count_byte_markers   100% 1 0 0   100% 0 0   100%
compare_tokenizers.py compare_tokenizers   100% 46 0 0   93% 14 1   98%
compare_tokenizers.py evaluate_regressions   97% 31 1 0   97% 36 1   97%
compare_tokenizers.py main   59% 17 7 0   38% 8 3   52%
compare_tokenizers.py (no function)   100% 20 0 2   100% 0 0   100%
context_config.py resolve_context_length   100% 8 0 0   100% 2 0   100%
context_config.py (no function)   100% 5 0 0   100% 0 0   100%
data.py get_text_column   100% 6 0 0   100% 8 0   100%
data.py create_infinite_stream   100% 2 0 0   100% 0 0   100%
data.py extract_text_from_row   100% 23 0 0   92% 26 2   96%
data.py packed_token_stream   100% 25 0 0   79% 14 3   92%
data.py AgenticDataMixture.__init__   100% 4 0 0   100% 0 0   100%
data.py AgenticDataMixture.__iter__   100% 3 0 0   100% 0 0   100%
data.py packed_collate_fn   100% 10 0 0   100% 2 0   100%
data.py create_dataloaders   74% 23 6 0   50% 10 1   67%
data.py (no function)   100% 16 0 0   100% 0 0   100%
dist_utils.py setup_distributed   100% 30 0 0   100% 10 0   100%
dist_utils.py cleanup_distributed   100% 2 0 0   100% 2 0   100%
dist_utils.py is_main_process   100% 3 0 0   100% 2 0   100%
dist_utils.py wrap_model_ddp   100% 3 0 0   100% 2 0   100%
dist_utils.py unwrap_model   100% 3 0 0   100% 2 0   100%
dist_utils.py barrier   100% 2 0 0   100% 2 0   100%
dist_utils.py get_world_size   100% 3 0 0   100% 2 0   100%
dist_utils.py (no function)   100% 14 0 0   100% 0 0   100%
gpu_smoke_test.py main   100% 14 0 0   100% 2 0   100%
gpu_smoke_test.py (no function)   100% 3 0 2   100% 0 0   100%
inference.py resolve_model_settings   100% 6 0 0   100% 4 0   100%
inference.py generate   100% 10 0 0   100% 0 0   100%
inference.py main   100% 15 0 0   100% 0 0   100%
inference.py (no function)   100% 11 0 2   100% 0 0   100%
kaggle_watchdog.py _candidate_repo_dirs   0% 10 10 0   0% 4 0   0%
kaggle_watchdog.py set_repo_directory   100% 7 0 0   100% 4 0   100%
kaggle_watchdog.py _load_kaggle_secrets   0% 3 3 0   100% 0 0   0%
kaggle_watchdog.py _load_colab_secrets   0% 2 2 0   100% 0 0   0%
kaggle_watchdog.py load_runtime_secrets   90% 21 2 0   100% 10 0   94%
kaggle_watchdog.py load_kaggle_secrets   100% 1 0 0   100% 0 0   100%
kaggle_watchdog.py start_background_sync   100% 8 0 0   100% 0 0   100%
kaggle_watchdog.py run_sync_self_check   100% 9 0 0   100% 0 0   100%
kaggle_watchdog.py main   100% 11 0 0   100% 4 0   100%
kaggle_watchdog.py (no function)   100% 14 0 2   100% 0 0   100%
model.py maybe_autocast   42% 12 7 0   30% 10 3   36%
model.py _mamba_chunk_scan_combined_fallback   100% 36 0 0   75% 12 3   94%
model.py _ternary_quant_kernel   0% 10 10 0   100% 0 0   0%
model.py TernaryQuantizeSTE.forward   50% 10 5 0   50% 2 1   50%
model.py TernaryQuantizeSTE.backward   100% 1 0 0   100% 0 0   100%
model.py weight_quant   100% 1 0 0   100% 0 0   100%
model.py activation_quant   100% 4 0 0   100% 0 0   100%
model.py BitLinear.__init__   100% 10 0 0   100% 2 0   100%
model.py BitLinear._clear_inference_cache   100% 2 0 0   100% 0 0   100%
model.py BitLinear._get_quantized_weight   100% 9 0 0   100% 4 0   100%
model.py BitLinear.prepare_for_inference   100% 3 0 0   100% 0 0   100%
model.py BitLinear.train   100% 3 0 0   100% 2 0   100%
model.py BitLinear.forward   100% 4 0 0   100% 0 0   100%
model.py RMSNorm.__init__   100% 3 0 0   100% 0 0   100%
model.py RMSNorm.forward   100% 2 0 0   100% 0 0   100%
model.py AttentionBlock.__init__   100% 10 0 0   100% 0 0   100%
model.py AttentionBlock.forward   88% 32 4 0   80% 10 2   86%
model.py AttentionBlock.prefill   77% 13 3 0   50% 2 1   73%
model.py AttentionBlock.step   79% 14 3 0   50% 2 1   75%
model.py BitMambaBlock.__init__   100% 26 0 0   100% 0 0   100%
model.py BitMambaBlock.forward   93% 15 1 0   50% 2 1   88%
model.py BitMambaBlock.prefill   95% 20 1 0   75% 4 1   92%
model.py BitMambaBlock.step   76% 46 11 0   50% 4 2   74%
model.py BitMambaLLM.__init__   100% 18 0 0   100% 6 0   100%
model.py BitMambaLLM._backbone   100% 7 0 0   100% 4 0   100%
model.py BitMambaLLM.forward   75% 4 1 0   50% 2 1   67%
model.py BitMambaLLM.forward_hidden   100% 1 0 0   100% 0 0   100%
model.py BitMambaLLM.prepare_for_inference   100% 5 0 0   100% 4 0   100%
model.py BitMambaLLM.generate   100% 22 0 0   100% 10 0   100%
model.py chunked_cross_entropy   100% 11 0 0   100% 4 0   100%
model.py (no function)   94% 70 4 0   50% 4 2   92%
optim.py _resolve_adam_class   22% 9 7 0   25% 4 1   23%
optim.py Muon.__init__   100% 3 0 0   100% 0 0   100%
optim.py Muon._get_ns_workspace   100% 5 0 0   100% 2 0   100%
optim.py Muon.step   94% 33 2 0   93% 14 1   94%
optim.py setup_mamba_optimizers   100% 13 0 0   88% 8 1   95%
optim.py FGWSD_Scheduler.__init__   100% 10 0 0   100% 2 0   100%
optim.py FGWSD_Scheduler.get_lr_and_ctx   100% 11 0 0   100% 8 0   100%
optim.py FGWSD_Scheduler.step   100% 5 0 0   100% 2 0   100%
optim.py (no function)   100% 13 0 0   100% 0 0   100%
rl_train.py collect_data_files   100% 6 0 0   83% 6 1   92%
rl_train.py compute_format_reward   100% 6 0 0   100% 4 0   100%
rl_train.py compute_accuracy_reward   100% 6 0 0   100% 4 0   100%
rl_train.py compute_conciseness_penalty   100% 7 0 0   100% 4 0   100%
rl_train.py _extract_thought_and_answer   100% 9 0 0   100% 4 0   100%
rl_train.py compute_rewards   100% 8 0 0   100% 2 0   100%
rl_train.py filter_problems_on_policy   72% 29 8 0   67% 12 2   71%
rl_train.py run_rl_steps   80% 79 16 0   47% 34 6   70%
rl_train.py main   0% 22 22 0   0% 6 0   0%
rl_train.py (no function)   100% 31 0 2   100% 0 0   100%
sft_data.py _first_token_id   100% 12 0 0   90% 10 1   95%
sft_data.py SFTChatDataset.__init__   71% 42 12 0   57% 28 6   66%
sft_data.py SFTChatDataset.__len__   100% 1 0 0   50% 2 1   67%
sft_data.py SFTChatDataset._row_to_messages   100% 20 0 0   100% 14 0   100%
sft_data.py SFTChatDataset.__getitem__   100% 27 0 0   83% 12 2   95%
sft_data.py sft_collate_fn   100% 11 0 0   100% 4 0   100%
sft_data.py create_sft_dataloader   85% 20 3 0   75% 8 2   82%
sft_data.py (no function)   100% 17 0 0   100% 0 0   100%
sft_train.py run_sft_stage   93% 68 5 0   67% 24 8   86%
sft_train.py main   0% 18 18 0   0% 6 0   0%
sft_train.py (no function)   100% 20 0 2   100% 0 0   100%
synth_data.py truncate_source   100% 5 0 0   100% 2 0   100%
synth_data.py iter_source_texts   88% 17 2 0   69% 16 5   79%
synth_data.py run_pipeline   91% 33 3 0   62% 8 3   85%
synth_data.py main   0% 11 11 0   100% 0 0   0%
synth_data.py (no function)   100% 16 0 2   100% 0 0   100%
train.py _parse_runtime_args   0% 4 4 0   100% 0 0   0%
train.py _resolve_amp_dtype   0% 7 7 0   0% 6 0   0%
train.py create_seq_idx_batch   100% 12 0 0   100% 6 0   100%
train.py run_training_steps   84% 81 13 0   73% 26 5   81%
train.py load_latest_checkpoint   0% 14 14 0   0% 2 0   0%
train.py main   0% 38 38 0   0% 14 0   0%
train.py (no function)   83% 42 7 2   25% 4 1   78%
train_tokenizer.py _resolve_profile   100% 6 0 0   100% 4 0   100%
train_tokenizer.py _profile_default   100% 1 0 0   100% 0 0   100%
train_tokenizer.py _corpus_bytes_for_ram   100% 2 0 0   100% 0 0   100%
train_tokenizer.py _resolve_backend   88% 8 1 0   83% 6 1   86%
train_tokenizer.py get_text_column   100% 7 0 0   100% 8 0   100%
train_tokenizer.py maybe_trim_text   100% 8 0 0   100% 6 0   100%
train_tokenizer.py iter_data_files   100% 5 0 0   100% 6 0   100%
train_tokenizer.py iter_text_from_rows   100% 10 0 0   100% 8 0   100%
train_tokenizer.py iter_jsonl_rows   100% 12 0 0   100% 6 0   100%
train_tokenizer.py iter_json_texts   0% 2 2 0   100% 0 0   0%
train_tokenizer.py iter_parquet_texts   100% 12 0 0   100% 8 0   100%
train_tokenizer.py iter_file_texts   88% 8 1 0   75% 4 1   83%
train_tokenizer.py batch_iterator   100% 24 0 0   92% 12 1   97%
train_tokenizer.py _prune_counter   100% 5 0 0   100% 2 0   100%
train_tokenizer.py _iter_training_pieces   100% 7 0 0   100% 6 0   100%
train_tokenizer.py _normalize_text_for_training   100% 19 0 0   92% 12 1   97%
train_tokenizer.py _count_word_frequencies   0% 25 25 0   0% 12 0   0%
train_tokenizer.py _build_allowed_words   100% 8 0 0   100% 2 0   100%
train_tokenizer.py _filtered_batch_iterator   0% 26 26 0   0% 14 0   0%
train_tokenizer.py _run_sentencepiece_backend   88% 17 2 0   50% 8 4   76%
train_tokenizer.py _train_hf_backend   0% 13 13 0   100% 0 0   0%
train_tokenizer.py main   0% 5 5 0   0% 2 0   0%
train_tokenizer.py (no function)   100% 49 0 2   100% 0 0   100%
train_tokenizer_spm.py _resolve_profile   83% 12 2 0   80% 10 2   82%
train_tokenizer_spm.py _parse_domain_map   77% 13 3 0   62% 8 3   71%
train_tokenizer_spm.py _normalize_domain_weights   67% 9 3 0   62% 8 3   65%
train_tokenizer_spm.py _calculate_domain_quotas   60% 10 4 0   33% 6 2   50%
train_tokenizer_spm.py _load_profile_registry   23% 13 10 0   12% 8 1   19%
train_tokenizer_spm.py _resolve_profile_settings   74% 19 5 0   70% 10 1   72%
train_tokenizer_spm.py _auto_tune_input_sentence_size   79% 24 5 0   80% 10 2   79%
train_tokenizer_spm.py parse_args   100% 16 0 0   100% 0 0   100%
train_tokenizer_spm.py _infer_domain   100% 10 0 0   100% 8 0   100%
train_tokenizer_spm.py _build_temp_corpus   97% 33 1 0   94% 18 1   96%
train_tokenizer_spm.py _write_run_manifest   0% 4 4 0   100% 0 0   0%
train_tokenizer_spm.py _resolve_model_max_length   100% 9 0 0   75% 4 1   92%
train_tokenizer_spm.py _export_hf_tokenizer   82% 40 7 6   100% 0 0   82%
train_tokenizer_spm.py main   100% 31 0 0   100% 6 0   100%
train_tokenizer_spm.py (no function)   100% 26 0 2   100% 0 0   100%
upscale.py upscaler   98% 41 1 0   75% 12 3   92%
upscale.py (no function)   100% 4 0 3   100% 0 0   100%
validate.py resolve_model_config   0% 8 8 0   0% 6 0   0%
validate.py parse_checkpoint_step   100% 5 0 0   100% 2 0   100%
validate.py resolve_default_checkpoint_dir   0% 1 1 0   100% 0 0   0%
validate.py discover_checkpoints   0% 13 13 0   0% 8 0   0%
validate.py _resolve_existing_path   86% 7 1 0   75% 4 1   82%
validate.py load_manifest_pillars   88% 16 2 0   67% 6 2   82%
validate.py iter_token_windows   70% 10 3 0   62% 8 3   67%
validate.py _run_loss_batch   0% 12 12 0   0% 2 0   0%
validate.py evaluate_pillar   0% 38 38 0   0% 16 0   0%
validate.py evaluate_checkpoint   25% 32 24 0   25% 4 1   25%
validate.py parse_args   0% 18 18 0   100% 0 0   0%
validate.py main   0% 23 23 0   0% 6 0   0%
validate.py (no function)   100% 31 0 2   100% 0 0   100%
Total     76% 3014 710 37   68% 1044 135   74%

No items found using the specified filter.