systemk/popular-code
收藏 | Hugging Face | 2024-02-22 更新 | 2024-03-04 收录
下载链接:
https://hf-mirror.com/datasets/systemk/popular-code
下载链接
链接失效反馈官方服务:
资源简介:
---
dataset_info:
- config_name: assembly
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 185152071.87902868
num_examples: 22311
- name: test
num_bytes: 20580751.120971322
num_examples: 2480
download_size: 67003168
dataset_size: 205732823.0
- config_name: batchfile
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 20075860.935047586
num_examples: 21560
- name: test
num_bytes: 2231065.0649524126
num_examples: 2396
download_size: 9992348
dataset_size: 22306926.0
- config_name: c
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: float64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 5067481722.438739
num_examples: 768311
- name: test
num_bytes: 563054257.5612613
num_examples: 85368
download_size: 1959592942
dataset_size: 5630535980.0
- config_name: c-sharp
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: float64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 4592570709.738392
num_examples: 972115
- name: test
num_bytes: 510286684.2616079
num_examples: 108013
download_size: 1518897077
dataset_size: 5102857394.0
- config_name: cmake
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 32188311.28346837
num_examples: 16773
- name: test
num_bytes: 3577118.7165316306
num_examples: 1864
download_size: 14604243
dataset_size: 35765430.0
- config_name: cpp
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: float64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 4768231984.89816
num_examples: 571816
- name: test
num_bytes: 529810966.1018396
num_examples: 63536
download_size: 1728320661
dataset_size: 5298042951.0
- config_name: css
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 848462306.4871161
num_examples: 244944
- name: test
num_bytes: 94277053.51288392
num_examples: 27217
download_size: 307876548
dataset_size: 942739360.0
- config_name: default
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 60424176321.07302
num_examples: 13520621
- name: test
num_bytes: 6713800844.926977
num_examples: 1502292
download_size: 25214779682
dataset_size: 67137977166.0
- config_name: dockerfile
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 40861170.9
num_examples: 51435
- name: test
num_bytes: 4540130.1
num_examples: 5715
download_size: 22383514
dataset_size: 45401301.0
- config_name: fortran
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 116444383.79079287
num_examples: 14291
- name: test
num_bytes: 12939170.209207129
num_examples: 1588
download_size: 43286400
dataset_size: 129383554.0
- config_name: go
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 2207276664.435403
num_examples: 423046
- name: test
num_bytes: 245257600.5645971
num_examples: 47006
download_size: 825463406
dataset_size: 2452534265.0
- config_name: haskell
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 208607302.55979314
num_examples: 48730
- name: test
num_bytes: 23180967.44020685
num_examples: 5415
download_size: 86706642
dataset_size: 231788270.0
- config_name: html
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 2892607238.080207
num_examples: 296996
- name: test
num_bytes: 321405132.91979295
num_examples: 33000
download_size: 1019975731
dataset_size: 3214012371.0
- config_name: java
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 8559534877.711628
num_examples: 1806459
- name: test
num_bytes: 951061010.2883722
num_examples: 200718
download_size: 3173260121
dataset_size: 9510595888.0
- config_name: javascript
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 5891105157.969938
num_examples: 1758985
- name: test
num_bytes: 654567984.030062
num_examples: 195443
download_size: 2451299575
dataset_size: 6545673142.0
- config_name: julia
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 118357902.97670639
num_examples: 26582
- name: test
num_bytes: 13152857.023293607
num_examples: 2954
download_size: 50895242
dataset_size: 131510760.0
- config_name: lua
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 285155371.2303212
num_examples: 49450
- name: test
num_bytes: 31687133.76967877
num_examples: 5495
download_size: 109173752
dataset_size: 316842505.0
- config_name: makefile
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 95894814.03596312
num_examples: 59160
- name: test
num_bytes: 10656059.964036876
num_examples: 6574
download_size: 42748861
dataset_size: 106550874.0
- config_name: markdown
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 8089968231.110576
num_examples: 1892635
- name: test
num_bytes: 898886308.8894247
num_examples: 210293
download_size: 4412277013
dataset_size: 8988854540.0
- config_name: perl
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 165252209.2220307
num_examples: 32894
- name: test
num_bytes: 18361914.7779693
num_examples: 3655
download_size: 73056742
dataset_size: 183614124.0
- config_name: php
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 4670622386.956541
num_examples: 1411470
- name: test
num_bytes: 518961352.0434591
num_examples: 156831
download_size: 1831244889
dataset_size: 5189583739.0
- config_name: powershell
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 107302772.56389657
num_examples: 24085
- name: test
num_bytes: 11926490.43610343
num_examples: 2677
download_size: 40851866
dataset_size: 119229263.0
- config_name: python
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 5828118254.741786
num_examples: 1157997
- name: test
num_bytes: 647572050.2582142
num_examples: 128667
download_size: 2401359464
dataset_size: 6475690305.0
- config_name: ruby
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 683527631.192737
num_examples: 305128
- name: test
num_bytes: 75949505.80726303
num_examples: 33904
download_size: 294077915
dataset_size: 759477137.0
- config_name: rust
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 736780485.8990481
num_examples: 124241
- name: test
num_bytes: 81867134.10095185
num_examples: 13805
download_size: 255662703
dataset_size: 818647620.0
- config_name: scala
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 405211398.3278998
num_examples: 122020
- name: test
num_bytes: 45024226.672100194
num_examples: 13558
download_size: 170432747
dataset_size: 450235625.0
- config_name: shell
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 292522541.8715689
num_examples: 198568
- name: test
num_bytes: 32503814.128431052
num_examples: 22064
download_size: 151818390
dataset_size: 325026356.0
- config_name: sql
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 423121499.70790017
num_examples: 87787
- name: test
num_bytes: 47017784.29209981
num_examples: 9755
download_size: 135894444
dataset_size: 470139284.0
- config_name: tex
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 521708011.01700556
num_examples: 47049
- name: test
num_bytes: 57971252.98299444
num_examples: 5228
download_size: 244760184
dataset_size: 579679264.0
- config_name: typescript
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 2497822556.7624574
num_examples: 949259
- name: test
num_bytes: 277537886.23754257
num_examples: 105474
download_size: 1039368886
dataset_size: 2775360443.0
- config_name: visual-basic
features:
- name: max_stars_repo_path
dtype: string
- name: max_stars_repo_name
dtype: string
- name: max_stars_count
dtype: int64
- name: id
dtype: string
- name: content
dtype: string
- name: language
dtype: string
splits:
- name: train
num_bytes: 72145624.30813125
num_examples: 14510
- name: test
num_bytes: 8020047.691868759
num_examples: 1613
download_size: 24980666
dataset_size: 80165672.0
configs:
- config_name: assembly
data_files:
- split: train
path: assembly/train-*
- split: test
path: assembly/test-*
- config_name: batchfile
data_files:
- split: train
path: batchfile/train-*
- split: test
path: batchfile/test-*
- config_name: c
data_files:
- split: train
path: c/train-*
- split: test
path: c/test-*
- config_name: c-sharp
data_files:
- split: train
path: c-sharp/train-*
- split: test
path: c-sharp/test-*
- config_name: cmake
data_files:
- split: train
path: cmake/train-*
- split: test
path: cmake/test-*
- config_name: cpp
data_files:
- split: train
path: cpp/train-*
- split: test
path: cpp/test-*
- config_name: css
data_files:
- split: train
path: css/train-*
- split: test
path: css/test-*
- config_name: default
data_files:
- split: train
path: data/train-*
- split: test
path: data/test-*
- config_name: dockerfile
data_files:
- split: train
path: dockerfile/train-*
- split: test
path: dockerfile/test-*
- config_name: fortran
data_files:
- split: train
path: fortran/train-*
- split: test
path: fortran/test-*
- config_name: go
data_files:
- split: train
path: go/train-*
- split: test
path: go/test-*
- config_name: haskell
data_files:
- split: train
path: haskell/train-*
- split: test
path: haskell/test-*
- config_name: html
data_files:
- split: train
path: html/train-*
- split: test
path: html/test-*
- config_name: java
data_files:
- split: train
path: java/train-*
- split: test
path: java/test-*
- config_name: javascript
data_files:
- split: train
path: javascript/train-*
- split: test
path: javascript/test-*
- config_name: julia
data_files:
- split: train
path: julia/train-*
- split: test
path: julia/test-*
- config_name: lua
data_files:
- split: train
path: lua/train-*
- split: test
path: lua/test-*
- config_name: makefile
data_files:
- split: train
path: makefile/train-*
- split: test
path: makefile/test-*
- config_name: markdown
data_files:
- split: train
path: markdown/train-*
- split: test
path: markdown/test-*
- config_name: perl
data_files:
- split: train
path: perl/train-*
- split: test
path: perl/test-*
- config_name: php
data_files:
- split: train
path: php/train-*
- split: test
path: php/test-*
- config_name: powershell
data_files:
- split: train
path: powershell/train-*
- split: test
path: powershell/test-*
- config_name: python
data_files:
- split: train
path: python/train-*
- split: test
path: python/test-*
- config_name: ruby
data_files:
- split: train
path: ruby/train-*
- split: test
path: ruby/test-*
- config_name: rust
data_files:
- split: train
path: rust/train-*
- split: test
path: rust/test-*
- config_name: scala
data_files:
- split: train
path: scala/train-*
- split: test
path: scala/test-*
- config_name: shell
data_files:
- split: train
path: shell/train-*
- split: test
path: shell/test-*
- config_name: sql
data_files:
- split: train
path: sql/train-*
- split: test
path: sql/test-*
- config_name: tex
data_files:
- split: train
path: tex/train-*
- split: test
path: tex/test-*
- config_name: typescript
data_files:
- split: train
path: typescript/train-*
- split: test
path: typescript/test-*
- config_name: visual-basic
data_files:
- split: train
path: visual-basic/train-*
- split: test
path: visual-basic/test-*
---
提供机构:
systemk
原始信息汇总
数据集概述
数据集配置
配置名称:assembly
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 185152071.87902868 字节, 22311 个样本
- test: 20580751.120971322 字节, 2480 个样本
- 下载大小:67003168 字节
- 数据集大小:205732823.0 字节
配置名称:batchfile
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 20075860.935047586 字节, 21560 个样本
- test: 2231065.0649524126 字节, 2396 个样本
- 下载大小:9992348 字节
- 数据集大小:22306926.0 字节
配置名称:c
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: float64
- id: string
- content: string
- language: string
- 分割:
- train: 5067481722.438739 字节, 768311 个样本
- test: 563054257.5612613 字节, 85368 个样本
- 下载大小:1959592942 字节
- 数据集大小:5630535980.0 字节
配置名称:c-sharp
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: float64
- id: string
- content: string
- language: string
- 分割:
- train: 4592570709.738392 字节, 972115 个样本
- test: 510286684.2616079 字节, 108013 个样本
- 下载大小:1518897077 字节
- 数据集大小:5102857394.0 字节
配置名称:cmake
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 32188311.28346837 字节, 16773 个样本
- test: 3577118.7165316306 字节, 1864 个样本
- 下载大小:14604243 字节
- 数据集大小:35765430.0 字节
配置名称:cpp
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: float64
- id: string
- content: string
- language: string
- 分割:
- train: 4768231984.89816 字节, 571816 个样本
- test: 529810966.1018396 字节, 63536 个样本
- 下载大小:1728320661 字节
- 数据集大小:5298042951.0 字节
配置名称:css
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 848462306.4871161 字节, 244944 个样本
- test: 94277053.51288392 字节, 27217 个样本
- 下载大小:307876548 字节
- 数据集大小:942739360.0 字节
配置名称:default
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 60424176321.07302 字节, 13520621 个样本
- test: 6713800844.926977 字节, 1502292 个样本
- 下载大小:25214779682 字节
- 数据集大小:67137977166.0 字节
配置名称:dockerfile
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 40861170.9 字节, 51435 个样本
- test: 4540130.1 字节, 5715 个样本
- 下载大小:22383514 字节
- 数据集大小:45401301.0 字节
配置名称:fortran
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 116444383.79079287 字节, 14291 个样本
- test: 12939170.209207129 字节, 1588 个样本
- 下载大小:43286400 字节
- 数据集大小:129383554.0 字节
配置名称:go
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 2207276664.435403 字节, 423046 个样本
- test: 245257600.5645971 字节, 47006 个样本
- 下载大小:825463406 字节
- 数据集大小:2452534265.0 字节
配置名称:haskell
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 208607302.55979314 字节, 48730 个样本
- test: 23180967.44020685 字节, 5415 个样本
- 下载大小:86706642 字节
- 数据集大小:231788270.0 字节
配置名称:html
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 2892607238.080207 字节, 296996 个样本
- test: 321405132.91979295 字节, 33000 个样本
- 下载大小:1019975731 字节
- 数据集大小:3214012371.0 字节
配置名称:java
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 8559534877.711628 字节, 1806459 个样本
- test: 951061010.2883722 字节, 200718 个样本
- 下载大小:3173260121 字节
- 数据集大小:9510595888.0 字节
配置名称:javascript
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 5891105157.969938 字节, 1758985 个样本
- test: 654567984.030062 字节, 195443 个样本
- 下载大小:2451299575 字节
- 数据集大小:6545673142.0 字节
配置名称:julia
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 118357902.97670639 字节, 26582 个样本
- test: 13152857.023293607 字节, 2954 个样本
- 下载大小:50895242 字节
- 数据集大小:131510760.0 字节
配置名称:lua
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 285155371.2303212 字节, 49450 个样本
- test: 31687133.76967877 字节, 5495 个样本
- 下载大小:109173752 字节
- 数据集大小:316842505.0 字节
配置名称:makefile
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 95894814.03596312 字节, 59160 个样本
- test: 10656059.964036876 字节, 6574 个样本
- 下载大小:42748861 字节
- 数据集大小:106550874.0 字节
配置名称:markdown
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 8089968231.110576 字节, 1892635 个样本
- test: 898886308.8894247 字节, 210293 个样本
- 下载大小:4412277013 字节
- 数据集大小:8988854540.0 字节
配置名称:perl
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 165252209.2220307 字节, 32894 个样本
- test: 18361914.7779693 字节, 3655 个样本
- 下载大小:73056742 字节
- 数据集大小:183614124.0 字节
配置名称:php
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 4670622386.956541 字节, 1411470 个样本
- test: 518961352.0434591 字节, 156831 个样本
- 下载大小:1831244889 字节
- 数据集大小:5189583739.0 字节
配置名称:powershell
- 特征:
- max_stars_repo_path: string
- max_stars_repo_name: string
- max_stars_count: int64
- id: string
- content: string
- language: string
- 分割:
- train: 107302772.56389657 字节, 24085 个样本
- test: 11926490.43610343 字节, 2677 个样本



