five

YnezT/PathGen-shortest-path

收藏
Hugging Face2026-04-17 更新2026-04-26 收录
下载链接:
https://hf-mirror.com/datasets/YnezT/PathGen-shortest-path
下载链接
链接失效反馈
官方服务:
资源简介:
--- dataset_info: - config_name: cov_div_d128_c010 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 48666315 num_examples: 23040 download_size: 8170905 dataset_size: 48666315 - config_name: cov_div_d128_c015 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 485320670 num_examples: 221233 download_size: 54891281 dataset_size: 485320670 - config_name: cov_div_d128_c020 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 446869698 num_examples: 213514 download_size: 57534648 dataset_size: 446869698 - config_name: cov_div_d128_c030 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 556914984 num_examples: 260705 download_size: 76897673 dataset_size: 556914984 - config_name: cov_div_d128_c040 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 552764792 num_examples: 264034 download_size: 81835111 dataset_size: 552764792 - config_name: cov_div_d128_c060 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 561026913 num_examples: 268363 download_size: 90534242 dataset_size: 561026913 - config_name: cov_div_d128_c080 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 380438295 num_examples: 184320 download_size: 72009037 dataset_size: 380438295 - config_name: cov_div_d128_c100 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 474279217 num_examples: 230400 download_size: 90318588 dataset_size: 474279217 - config_name: cov_div_d16_c005 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 380070784 num_examples: 155122 download_size: 20991732 dataset_size: 380070784 - config_name: cov_div_d16_c010 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 364028995 num_examples: 161830 download_size: 23286399 dataset_size: 364028995 - config_name: cov_div_d16_c015 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 421681998 num_examples: 181432 download_size: 28950692 dataset_size: 421681998 - config_name: cov_div_d16_c020 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 402259930 num_examples: 181724 download_size: 29533367 dataset_size: 402259930 - config_name: cov_div_d16_c030 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 429716392 num_examples: 191047 download_size: 33307915 dataset_size: 429716392 - config_name: cov_div_d16_c040 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 429616389 num_examples: 193734 download_size: 35462098 dataset_size: 429616389 - config_name: cov_div_d16_c060 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 461470473 num_examples: 210208 download_size: 40221258 dataset_size: 461470473 - config_name: cov_div_d16_c080 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 445121866 num_examples: 205299 download_size: 42527804 dataset_size: 445121866 - config_name: cov_div_d16_c100 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 449743357 num_examples: 208111 download_size: 52716617 dataset_size: 449743357 - config_name: cov_div_d1_c005 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 264983563 num_examples: 105756 download_size: 14378990 dataset_size: 264983563 - config_name: cov_div_d1_c010 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 295619557 num_examples: 113604 download_size: 15839394 dataset_size: 295619557 - config_name: cov_div_d1_c015 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 272426445 num_examples: 111015 download_size: 14881381 dataset_size: 272426445 - config_name: cov_div_d1_c020 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 312353033 num_examples: 127177 download_size: 17366817 dataset_size: 312353033 - config_name: cov_div_d1_c030 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 335923433 num_examples: 134616 download_size: 18587923 dataset_size: 335923433 - config_name: cov_div_d1_c040 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 335244451 num_examples: 137713 download_size: 18546672 dataset_size: 335244451 - config_name: cov_div_d1_c060 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 366423359 num_examples: 151817 download_size: 20526830 dataset_size: 366423359 - config_name: cov_div_d1_c080 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 383590353 num_examples: 160504 download_size: 21656024 dataset_size: 383590353 - config_name: cov_div_d1_c100 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 380486403 num_examples: 160154 download_size: 22247910 dataset_size: 380486403 - config_name: cov_div_d2_c005 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 256805771 num_examples: 107219 download_size: 13986511 dataset_size: 256805771 - config_name: cov_div_d2_c010 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 318020690 num_examples: 127962 download_size: 17123934 dataset_size: 318020690 - config_name: cov_div_d2_c015 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 341997945 num_examples: 141365 download_size: 18787621 dataset_size: 341997945 - config_name: cov_div_d2_c020 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 339626633 num_examples: 140544 download_size: 19007935 dataset_size: 339626633 - config_name: cov_div_d2_c030 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 356962346 num_examples: 147197 download_size: 19961452 dataset_size: 356962346 - config_name: cov_div_d2_c040 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 377526547 num_examples: 158415 download_size: 21493697 dataset_size: 377526547 - config_name: cov_div_d2_c060 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 400739981 num_examples: 168504 download_size: 24438267 dataset_size: 400739981 - config_name: cov_div_d2_c080 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 395382208 num_examples: 170111 download_size: 25594281 dataset_size: 395382208 - config_name: cov_div_d2_c100 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 402927385 num_examples: 174069 download_size: 27076922 dataset_size: 402927385 - config_name: cov_div_d32_c005 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 422728626 num_examples: 175457 download_size: 26846539 dataset_size: 422728626 - config_name: cov_div_d32_c010 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 426749157 num_examples: 183511 download_size: 30728331 dataset_size: 426749157 - config_name: cov_div_d32_c015 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 422362922 num_examples: 191424 download_size: 32947724 dataset_size: 422362922 - config_name: cov_div_d32_c020 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 439528282 num_examples: 196208 download_size: 36093313 dataset_size: 439528282 - config_name: cov_div_d32_c030 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 467189094 num_examples: 210842 download_size: 40151327 dataset_size: 467189094 - config_name: cov_div_d32_c040 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 446643211 num_examples: 205289 download_size: 42605641 dataset_size: 446643211 - config_name: cov_div_d32_c060 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 475275385 num_examples: 219934 download_size: 57798751 dataset_size: 475275385 - config_name: cov_div_d32_c080 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 453857701 num_examples: 213649 download_size: 59963913 dataset_size: 453857701 - config_name: cov_div_d32_c100 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 459758865 num_examples: 217032 download_size: 64456945 dataset_size: 459758865 - config_name: cov_div_d4_c005 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 310307261 num_examples: 121369 download_size: 16885874 dataset_size: 310307261 - config_name: cov_div_d4_c010 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 353879964 num_examples: 142939 download_size: 19660037 dataset_size: 353879964 - config_name: cov_div_d4_c015 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 376064771 num_examples: 155797 download_size: 20953054 dataset_size: 376064771 - config_name: cov_div_d4_c020 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 382037710 num_examples: 159606 download_size: 21814030 dataset_size: 382037710 - config_name: cov_div_d4_c030 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 392365665 num_examples: 164595 download_size: 23549870 dataset_size: 392365665 - config_name: cov_div_d4_c040 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 392752170 num_examples: 170032 download_size: 25472589 dataset_size: 392752170 - config_name: cov_div_d4_c060 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 411515626 num_examples: 178785 download_size: 28372226 dataset_size: 411515626 - config_name: cov_div_d4_c080 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 420805441 num_examples: 183805 download_size: 31055184 dataset_size: 420805441 - config_name: cov_div_d4_c100 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 421305097 num_examples: 187736 download_size: 31857315 dataset_size: 421305097 - config_name: cov_div_d64_c005 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 406456685 num_examples: 183925 download_size: 29736780 dataset_size: 406456685 - config_name: cov_div_d64_c010 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 437934872 num_examples: 197070 download_size: 36400444 dataset_size: 437934872 - config_name: cov_div_d64_c015 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 464179980 num_examples: 210083 download_size: 40407773 dataset_size: 464179980 - config_name: cov_div_d64_c020 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 449971117 num_examples: 205822 download_size: 42242380 dataset_size: 449971117 - config_name: cov_div_d64_c030 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 468630976 num_examples: 220607 download_size: 53287413 dataset_size: 468630976 - config_name: cov_div_d64_c040 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 460942204 num_examples: 214968 download_size: 60614150 dataset_size: 460942204 - config_name: cov_div_d64_c060 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 555830840 num_examples: 260520 download_size: 77390744 dataset_size: 555830840 - config_name: cov_div_d64_c080 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 553786004 num_examples: 263867 download_size: 81965077 dataset_size: 553786004 - config_name: cov_div_d64_c100 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 467688123 num_examples: 223724 download_size: 75936351 dataset_size: 467688123 - config_name: cov_div_d8_c005 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 342825727 num_examples: 144590 download_size: 18915848 dataset_size: 342825727 - config_name: cov_div_d8_c010 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 396243588 num_examples: 162108 download_size: 22192357 dataset_size: 396243588 - config_name: cov_div_d8_c015 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 395768564 num_examples: 168877 download_size: 24023438 dataset_size: 395768564 - config_name: cov_div_d8_c020 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 409122523 num_examples: 173655 download_size: 26374269 dataset_size: 409122523 - config_name: cov_div_d8_c030 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 413715017 num_examples: 180654 download_size: 28571352 dataset_size: 413715017 - config_name: cov_div_d8_c040 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 419593262 num_examples: 183676 download_size: 30982163 dataset_size: 419593262 - config_name: cov_div_d8_c060 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 431660674 num_examples: 192599 download_size: 33572234 dataset_size: 431660674 - config_name: cov_div_d8_c080 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 425870730 num_examples: 193828 download_size: 35124770 dataset_size: 425870730 - config_name: cov_div_d8_c100 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 436251477 num_examples: 198134 download_size: 36674988 dataset_size: 436251477 - config_name: longshort_0_10 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 7423365 num_examples: 10000 download_size: 1920595 dataset_size: 7423365 - config_name: longshort_10_20 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 11988560 num_examples: 10000 download_size: 2632142 dataset_size: 11988560 - config_name: longshort_20_30 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 16957772 num_examples: 10000 download_size: 3258997 dataset_size: 16957772 - config_name: longshort_30_40 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 22003793 num_examples: 10000 download_size: 3864123 dataset_size: 22003793 - config_name: longshort_40_50 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 27009560 num_examples: 10000 download_size: 4319401 dataset_size: 27009560 - config_name: longshort_50_60 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 32024763 num_examples: 10000 download_size: 4564035 dataset_size: 32024763 - config_name: longshort_60_70 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 36971753 num_examples: 10000 download_size: 4871532 dataset_size: 36971753 - config_name: longshort_70_80 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 41678944 num_examples: 10000 download_size: 5110423 dataset_size: 41678944 - config_name: longshort_80_90 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 2735503 num_examples: 594 download_size: 274885 dataset_size: 2735503 - config_name: qa_c001_ans1 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 6862814 num_examples: 6446 download_size: 1625293 dataset_size: 6862814 - config_name: qa_c001_ans16 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 7748166 num_examples: 6446 download_size: 710986 dataset_size: 7748166 - config_name: qa_c001_ans2 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 6957643 num_examples: 6446 download_size: 1360523 dataset_size: 6957643 - config_name: qa_c001_ans32 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 8005622 num_examples: 6446 download_size: 587443 dataset_size: 8005622 - config_name: qa_c001_ans4 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 7180764 num_examples: 6446 download_size: 1076032 dataset_size: 7180764 - config_name: qa_c001_ans64 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 8272545 num_examples: 6446 download_size: 586306 dataset_size: 8272545 - config_name: qa_c001_ans8 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 7420808 num_examples: 6446 download_size: 803701 dataset_size: 7420808 - config_name: qa_c005_ans1 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 34333383 num_examples: 32234 download_size: 8080354 dataset_size: 34333383 - config_name: qa_c005_ans16 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 38696300 num_examples: 32234 download_size: 3515105 dataset_size: 38696300 - config_name: qa_c005_ans2 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 34935833 num_examples: 32234 download_size: 6791680 dataset_size: 34935833 - config_name: qa_c005_ans32 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 39977865 num_examples: 32245 download_size: 2916555 dataset_size: 39977865 - config_name: qa_c005_ans4 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 35836279 num_examples: 32234 download_size: 5386602 dataset_size: 35836279 - config_name: qa_c005_ans64 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 41275262 num_examples: 32234 download_size: 2855150 dataset_size: 41275262 - config_name: qa_c005_ans8 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 37142818 num_examples: 32234 download_size: 3922932 dataset_size: 37142818 - config_name: qa_c010_ans1 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 68666618 num_examples: 64469 download_size: 16140279 dataset_size: 68666618 - config_name: qa_c010_ans16 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 77291631 num_examples: 64469 download_size: 7037761 dataset_size: 77291631 - config_name: qa_c010_ans2 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 69948101 num_examples: 64469 download_size: 13596759 dataset_size: 69948101 - config_name: qa_c010_ans32 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 80628350 num_examples: 64469 download_size: 5772143 dataset_size: 80628350 - config_name: qa_c010_ans4 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 71652385 num_examples: 64469 download_size: 10762208 dataset_size: 71652385 - config_name: qa_c010_ans64 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 83103027 num_examples: 64475 download_size: 5749294 dataset_size: 83103027 - config_name: qa_c010_ans8 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 74143435 num_examples: 64469 download_size: 7858739 dataset_size: 74143435 - config_name: qa_c020_ans1 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 137343248 num_examples: 128939 download_size: 32277808 dataset_size: 137343248 - config_name: qa_c020_ans16 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 154177100 num_examples: 128939 download_size: 13970886 dataset_size: 154177100 - config_name: qa_c020_ans2 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 140076108 num_examples: 128939 download_size: 27188806 dataset_size: 140076108 - config_name: qa_c020_ans32 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 160083446 num_examples: 128939 download_size: 11494775 dataset_size: 160083446 - config_name: qa_c020_ans4 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 143376865 num_examples: 128939 download_size: 21531438 dataset_size: 143376865 - config_name: qa_c020_ans64 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 165760240 num_examples: 128939 download_size: 11534460 dataset_size: 165760240 - config_name: qa_c020_ans8 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 148268924 num_examples: 128939 download_size: 15709452 dataset_size: 148268924 - config_name: qa_c060_ans1 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 412193372 num_examples: 386817 download_size: 96824991 dataset_size: 412193372 - config_name: qa_c060_ans16 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 461760402 num_examples: 386817 download_size: 42049089 dataset_size: 461760402 - config_name: qa_c060_ans2 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 419934778 num_examples: 386817 download_size: 81572263 dataset_size: 419934778 - config_name: qa_c060_ans32 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 480401733 num_examples: 386821 download_size: 34499315 dataset_size: 480401733 - config_name: qa_c060_ans4 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 430958416 num_examples: 386817 download_size: 64770133 dataset_size: 430958416 - config_name: qa_c060_ans64 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 496620675 num_examples: 386865 download_size: 34320340 dataset_size: 496620675 - config_name: qa_c060_ans8 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 444883111 num_examples: 386817 download_size: 47110237 dataset_size: 444883111 - config_name: qa_c080_ans1 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 549638154 num_examples: 515756 download_size: 129100181 dataset_size: 549638154 - config_name: qa_c080_ans16 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 615154978 num_examples: 515756 download_size: 56071218 dataset_size: 615154978 - config_name: qa_c080_ans2 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 560196115 num_examples: 515756 download_size: 108827240 dataset_size: 560196115 - config_name: qa_c080_ans32 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 639649655 num_examples: 515756 download_size: 45996502 dataset_size: 639649655 - config_name: qa_c080_ans4 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 574902239 num_examples: 515756 download_size: 86428528 dataset_size: 574902239 - config_name: qa_c080_ans8 features: - name: input_ids_reveal sequence: int64 - name: attention_mask_reveal sequence: int64 - name: labels_reveal sequence: int64 - name: input_ids sequence: int32 - name: attention_mask sequence: int8 - name: labels sequence: int64 - name: start_idx dtype: int64 - name: end_idx dtype: int64 - name: index_path dtype: string - name: start_coord dtype: string - name: end_coord dtype: string - name: direction_seq dtype: string - name: direction_seq_reveal dtype: string - name: sp_distance dtype: int32 - name: coord_distance dtype: float64 splits: - name: train num_bytes: 594233518 num_examples: 515756 download_size: 62846030 dataset_size: 594233518 configs: - config_name: cov_div_d128_c010 data_files: - split: train path: cov_div_d128_c010/train-* - config_name: cov_div_d128_c015 data_files: - split: train path: cov_div_d128_c015/train-* - config_name: cov_div_d128_c020 data_files: - split: train path: cov_div_d128_c020/train-* - config_name: cov_div_d128_c030 data_files: - split: train path: cov_div_d128_c030/train-* - config_name: cov_div_d128_c040 data_files: - split: train path: cov_div_d128_c040/train-* - config_name: cov_div_d128_c060 data_files: - split: train path: cov_div_d128_c060/train-* - config_name: cov_div_d128_c080 data_files: - split: train path: cov_div_d128_c080/train-* - config_name: cov_div_d128_c100 data_files: - split: train path: cov_div_d128_c100/train-* - config_name: cov_div_d16_c005 data_files: - split: train path: cov_div_d16_c005/train-* - config_name: cov_div_d16_c010 data_files: - split: train path: cov_div_d16_c010/train-* - config_name: cov_div_d16_c015 data_files: - split: train path: cov_div_d16_c015/train-* - config_name: cov_div_d16_c020 data_files: - split: train path: cov_div_d16_c020/train-* - config_name: cov_div_d16_c030 data_files: - split: train path: cov_div_d16_c030/train-* - config_name: cov_div_d16_c040 data_files: - split: train path: cov_div_d16_c040/train-* - config_name: cov_div_d16_c060 data_files: - split: train path: cov_div_d16_c060/train-* - config_name: cov_div_d16_c080 data_files: - split: train path: cov_div_d16_c080/train-* - config_name: cov_div_d16_c100 data_files: - split: train path: cov_div_d16_c100/train-* - config_name: cov_div_d1_c005 data_files: - split: train path: cov_div_d1_c005/train-* - config_name: cov_div_d1_c010 data_files: - split: train path: cov_div_d1_c010/train-* - config_name: cov_div_d1_c015 data_files: - split: train path: cov_div_d1_c015/train-* - config_name: cov_div_d1_c020 data_files: - split: train path: cov_div_d1_c020/train-* - config_name: cov_div_d1_c030 data_files: - split: train path: cov_div_d1_c030/train-* - config_name: cov_div_d1_c040 data_files: - split: train path: cov_div_d1_c040/train-* - config_name: cov_div_d1_c060 data_files: - split: train path: cov_div_d1_c060/train-* - config_name: cov_div_d1_c080 data_files: - split: train path: cov_div_d1_c080/train-* - config_name: cov_div_d1_c100 data_files: - split: train path: cov_div_d1_c100/train-* - config_name: cov_div_d2_c005 data_files: - split: train path: cov_div_d2_c005/train-* - config_name: cov_div_d2_c010 data_files: - split: train path: cov_div_d2_c010/train-* - config_name: cov_div_d2_c015 data_files: - split: train path: cov_div_d2_c015/train-* - config_name: cov_div_d2_c020 data_files: - split: train path: cov_div_d2_c020/train-* - config_name: cov_div_d2_c030 data_files: - split: train path: cov_div_d2_c030/train-* - config_name: cov_div_d2_c040 data_files: - split: train path: cov_div_d2_c040/train-* - config_name: cov_div_d2_c060 data_files: - split: train path: cov_div_d2_c060/train-* - config_name: cov_div_d2_c080 data_files: - split: train path: cov_div_d2_c080/train-* - config_name: cov_div_d2_c100 data_files: - split: train path: cov_div_d2_c100/train-* - config_name: cov_div_d32_c005 data_files: - split: train path: cov_div_d32_c005/train-* - config_name: cov_div_d32_c010 data_files: - split: train path: cov_div_d32_c010/train-* - config_name: cov_div_d32_c015 data_files: - split: train path: cov_div_d32_c015/train-* - config_name: cov_div_d32_c020 data_files: - split: train path: cov_div_d32_c020/train-* - config_name: cov_div_d32_c030 data_files: - split: train path: cov_div_d32_c030/train-* - config_name: cov_div_d32_c040 data_files: - split: train path: cov_div_d32_c040/train-* - config_name: cov_div_d32_c060 data_files: - split: train path: cov_div_d32_c060/train-* - config_name: cov_div_d32_c080 data_files: - split: train path: cov_div_d32_c080/train-* - config_name: cov_div_d32_c100 data_files: - split: train path: cov_div_d32_c100/train-* - config_name: cov_div_d4_c005 data_files: - split: train path: cov_div_d4_c005/train-* - config_name: cov_div_d4_c010 data_files: - split: train path: cov_div_d4_c010/train-* - config_name: cov_div_d4_c015 data_files: - split: train path: cov_div_d4_c015/train-* - config_name: cov_div_d4_c020 data_files: - split: train path: cov_div_d4_c020/train-* - config_name: cov_div_d4_c030 data_files: - split: train path: cov_div_d4_c030/train-* - config_name: cov_div_d4_c040 data_files: - split: train path: cov_div_d4_c040/train-* - config_name: cov_div_d4_c060 data_files: - split: train path: cov_div_d4_c060/train-* - config_name: cov_div_d4_c080 data_files: - split: train path: cov_div_d4_c080/train-* - config_name: cov_div_d4_c100 data_files: - split: train path: cov_div_d4_c100/train-* - config_name: cov_div_d64_c005 data_files: - split: train path: cov_div_d64_c005/train-* - config_name: cov_div_d64_c010 data_files: - split: train path: cov_div_d64_c010/train-* - config_name: cov_div_d64_c015 data_files: - split: train path: cov_div_d64_c015/train-* - config_name: cov_div_d64_c020 data_files: - split: train path: cov_div_d64_c020/train-* - config_name: cov_div_d64_c030 data_files: - split: train path: cov_div_d64_c030/train-* - config_name: cov_div_d64_c040 data_files: - split: train path: cov_div_d64_c040/train-* - config_name: cov_div_d64_c060 data_files: - split: train path: cov_div_d64_c060/train-* - config_name: cov_div_d64_c080 data_files: - split: train path: cov_div_d64_c080/train-* - config_name: cov_div_d64_c100 data_files: - split: train path: cov_div_d64_c100/train-* - config_name: cov_div_d8_c005 data_files: - split: train path: cov_div_d8_c005/train-* - config_name: cov_div_d8_c010 data_files: - split: train path: cov_div_d8_c010/train-* - config_name: cov_div_d8_c015 data_files: - split: train path: cov_div_d8_c015/train-* - config_name: cov_div_d8_c020 data_files: - split: train path: cov_div_d8_c020/train-* - config_name: cov_div_d8_c030 data_files: - split: train path: cov_div_d8_c030/train-* - config_name: cov_div_d8_c040 data_files: - split: train path: cov_div_d8_c040/train-* - config_name: cov_div_d8_c060 data_files: - split: train path: cov_div_d8_c060/train-* - config_name: cov_div_d8_c080 data_files: - split: train path: cov_div_d8_c080/train-* - config_name: cov_div_d8_c100 data_files: - split: train path: cov_div_d8_c100/train-* - config_name: longshort_0_10 data_files: - split: train path: longshort_0_10/train-* - config_name: longshort_10_20 data_files: - split: train path: longshort_10_20/train-* - config_name: longshort_20_30 data_files: - split: train path: longshort_20_30/train-* - config_name: longshort_30_40 data_files: - split: train path: longshort_30_40/train-* - config_name: longshort_40_50 data_files: - split: train path: longshort_40_50/train-* - config_name: longshort_50_60 data_files: - split: train path: longshort_50_60/train-* - config_name: longshort_60_70 data_files: - split: train path: longshort_60_70/train-* - config_name: longshort_70_80 data_files: - split: train path: longshort_70_80/train-* - config_name: longshort_80_90 data_files: - split: train path: longshort_80_90/train-* - config_name: qa_c001_ans1 data_files: - split: train path: qa_c001_ans1/train-* - config_name: qa_c001_ans16 data_files: - split: train path: qa_c001_ans16/train-* - config_name: qa_c001_ans2 data_files: - split: train path: qa_c001_ans2/train-* - config_name: qa_c001_ans32 data_files: - split: train path: qa_c001_ans32/train-* - config_name: qa_c001_ans4 data_files: - split: train path: qa_c001_ans4/train-* - config_name: qa_c001_ans64 data_files: - split: train path: qa_c001_ans64/train-* - config_name: qa_c001_ans8 data_files: - split: train path: qa_c001_ans8/train-* - config_name: qa_c005_ans1 data_files: - split: train path: qa_c005_ans1/train-* - config_name: qa_c005_ans16 data_files: - split: train path: qa_c005_ans16/train-* - config_name: qa_c005_ans2 data_files: - split: train path: qa_c005_ans2/train-* - config_name: qa_c005_ans32 data_files: - split: train path: qa_c005_ans32/train-* - config_name: qa_c005_ans4 data_files: - split: train path: qa_c005_ans4/train-* - config_name: qa_c005_ans64 data_files: - split: train path: qa_c005_ans64/train-* - config_name: qa_c005_ans8 data_files: - split: train path: qa_c005_ans8/train-* - config_name: qa_c010_ans1 data_files: - split: train path: qa_c010_ans1/train-* - config_name: qa_c010_ans16 data_files: - split: train path: qa_c010_ans16/train-* - config_name: qa_c010_ans2 data_files: - split: train path: qa_c010_ans2/train-* - config_name: qa_c010_ans32 data_files: - split: train path: qa_c010_ans32/train-* - config_name: qa_c010_ans4 data_files: - split: train path: qa_c010_ans4/train-* - config_name: qa_c010_ans64 data_files: - split: train path: qa_c010_ans64/train-* - config_name: qa_c010_ans8 data_files: - split: train path: qa_c010_ans8/train-* - config_name: qa_c020_ans1 data_files: - split: train path: qa_c020_ans1/train-* - config_name: qa_c020_ans16 data_files: - split: train path: qa_c020_ans16/train-* - config_name: qa_c020_ans2 data_files: - split: train path: qa_c020_ans2/train-* - config_name: qa_c020_ans32 data_files: - split: train path: qa_c020_ans32/train-* - config_name: qa_c020_ans4 data_files: - split: train path: qa_c020_ans4/train-* - config_name: qa_c020_ans64 data_files: - split: train path: qa_c020_ans64/train-* - config_name: qa_c020_ans8 data_files: - split: train path: qa_c020_ans8/train-* - config_name: qa_c060_ans1 data_files: - split: train path: qa_c060_ans1/train-* - config_name: qa_c060_ans16 data_files: - split: train path: qa_c060_ans16/train-* - config_name: qa_c060_ans2 data_files: - split: train path: qa_c060_ans2/train-* - config_name: qa_c060_ans32 data_files: - split: train path: qa_c060_ans32/train-* - config_name: qa_c060_ans4 data_files: - split: train path: qa_c060_ans4/train-* - config_name: qa_c060_ans64 data_files: - split: train path: qa_c060_ans64/train-* - config_name: qa_c060_ans8 data_files: - split: train path: qa_c060_ans8/train-* - config_name: qa_c080_ans1 data_files: - split: train path: qa_c080_ans1/train-* - config_name: qa_c080_ans16 data_files: - split: train path: qa_c080_ans16/train-* - config_name: qa_c080_ans2 data_files: - split: train path: qa_c080_ans2/train-* - config_name: qa_c080_ans32 data_files: - split: train path: qa_c080_ans32/train-* - config_name: qa_c080_ans4 data_files: - split: train path: qa_c080_ans4/train-* - config_name: qa_c080_ans8 data_files: - split: train path: qa_c080_ans8/train-* ---
提供机构:
YnezT
5,000+
优质数据集
54 个
任务类型
进入经典数据集
二维码
社区交流群

面向社区/商业的数据集话题

二维码
科研交流群

面向高校/科研机构的开源数据集话题

数据驱动未来

携手共赢发展

商业合作