In [4]:
import hail as hl
# Dimensions of the simulated dataset, named so they are easy to find and tune.
N_POPULATIONS = 3
N_SAMPLES = 500
N_VARIANTS = 500000
N_PARTITIONS = 32

# Simulate genotypes with the Balding-Nichols model; the result is bound to `mt`.
mt = hl.balding_nichols_model(
    n_populations=N_POPULATIONS,
    n_samples=N_SAMPLES,
    n_variants=N_VARIANTS,
    n_partitions=N_PARTITIONS,
)

# Preview only the first 10 rows rather than dumping the whole dataset.
mt.show(n_rows=10)
2021-06-22 17:45:44 Hail: INFO: balding_nichols_model: generating genotypes for 3 populations, 500 samples, and 500000 variants...
2021-06-22 17:45:45 Hail: INFO: Coerced sorted dataset
0
1
2
3
4
5
6
7
locus
alleles
GT
GT
GT
GT
GT
GT
GT
GT
locus<GRCh37>array<str>callcallcallcallcallcallcallcall
1:1["A","C"]0/00/00/11/10/10/00/10/1
1:2["A","C"]0/11/11/10/10/11/10/10/1
1:3["A","C"]1/11/10/10/10/10/00/01/1
1:4["A","C"]0/11/10/00/00/10/10/00/1
1:5["A","C"]0/00/00/00/00/00/01/11/1
1:6["A","C"]0/11/10/00/10/10/10/11/1
1:7["A","C"]0/10/00/01/10/00/10/10/1
1:8["A","C"]0/11/11/11/11/11/10/10/1
1:9["A","C"]1/10/11/10/11/11/11/11/1
1:10["A","C"]0/10/00/00/10/10/00/10/1

showing top 10 rows

showing the first 8 of 500 columns

In [ ]: