| \n", + " | swiss_id | \n", + "accession | \n", + "go_ids | \n", + "sequence | \n", + "41 | \n", + "75 | \n", + "122 | \n", + "165 | \n", + "209 | \n", + "226 | \n", + "... | \n", + "1990778 | \n", + "2000026 | \n", + "2000145 | \n", + "2000146 | \n", + "2000147 | \n", + "2000241 | \n", + "2000243 | \n", + "2001141 | \n", + "2001233 | \n", + "2001234 | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1 | \n", + "11S1_CARIL | \n", + "B5KVH4 | \n", + "[3006, 8150, 9791, 10431, 21700, 22414, 32501,... | \n", + "MAKPILLSIYLCLIIVALFNGCLAQSGGRQQHKFGQCQLNRLDALE... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "
| 3 | \n", + "11S2_SESIN | \n", + "Q9XHP0 | \n", + "[3006, 8150, 10431, 21700, 22414, 32502, 48609] | \n", + "MVAFKFLLALSLSLLVSAAIAQTREPRLTQGQQCRFQRISGAQPSL... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "
| 6 | \n", + "14310_ARATH | \n", + "P48347,Q9LME5 | \n", + "[7165, 8150, 9742, 9755, 9987, 43401, 50789, 5... | \n", + "MENEREKQVYLAKLSEQTERYDEMVEAMKKVAQLDVELTVEERNLV... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "
| 8 | \n", + "14331_ARATH | \n", + "P42643,Q945M2,Q9M0S7 | \n", + "[8150, 19222, 50789, 65007] | \n", + "MATPGASSARDEFVYMAKLAEQAERYEEMVEFMEKVAKAVDKDELT... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "
| 9 | \n", + "14331_CAEEL | \n", + "P41932,Q21537 | \n", + "[132, 226, 1708, 6611, 6810, 6886, 6913, 6950,... | \n", + "MSDTVEELVQRAKLAEQAERYDDMAAAMKKVTEQGQELSNEERNLL... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "True | \n", + "... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "
5 rows Γ 902 columns
\n", + "| \n", + " | id | \n", + "split | \n", + "
|---|---|---|
| 0 | \n", + "14331_ARATH | \n", + "train | \n", + "
| 1 | \n", + "14331_CAEEL | \n", + "train | \n", + "
| 2 | \n", + "14331_MAIZE | \n", + "train | \n", + "
| 3 | \n", + "14332_MAIZE | \n", + "train | \n", + "
| 4 | \n", + "14333_ARATH | \n", + "train | \n", + "
| \n", + " | id | \n", + "sids | \n", + "sequence | \n", + "class_46456 | \n", + "class_48724 | \n", + "class_51349 | \n", + "class_53931 | \n", + "class_56572 | \n", + "class_56835 | \n", + "class_56992 | \n", + "... | \n", + "species_187294 | \n", + "species_56257 | \n", + "species_186882 | \n", + "species_56690 | \n", + "species_161316 | \n", + "species_57962 | \n", + "species_58067 | \n", + "species_267696 | \n", + "species_311502 | \n", + "species_311501 | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "1 | \n", + "[d4oq9a_, d4oq9b_, d4oq9c_, d4oq9d_, d4niaa_, ... | \n", + "AAAAAAAAAA | \n", + "False | \n", + "True | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "
| 1 | \n", + "2 | \n", + "[d7dxhc_] | \n", + "AAAAAAAAAAAAAAAAAAAAAAA | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "True | \n", + "False | \n", + "... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "
| 2 | \n", + "3 | \n", + "[d1gkub1, d1gkub2, d1gkub3, d1gkub4] | \n", + "AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAASLCLFPEDFLLKEF... | \n", + "False | \n", + "False | \n", + "True | \n", + "False | \n", + "True | \n", + "False | \n", + "False | \n", + "... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "True | \n", + "
| 3 | \n", + "4 | \n", + "[d3c9wa2, d3c9wb2, d3c9wa3, d3c9wb3] | \n", + "AAAAAAGPEMVRGQVFDVGPRYTNLSYIGEGAYGMVCSAYDNLNKV... | \n", + "False | \n", + "False | \n", + "False | \n", + "True | \n", + "False | \n", + "False | \n", + "False | \n", + "... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "True | \n", + "
| 4 | \n", + "5 | \n", + "[d1xwaa1, d1xwab_, d1xwac_, d1xwad_, d1xwaa2] | \n", + "AAAAAMVYQVKDKADLDGQLTKASGKLVVLDFFATWCGPCKMISPK... | \n", + "False | \n", + "False | \n", + "True | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "... | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "False | \n", + "True | \n", + "
5 rows Γ 1035 columns
\n", + "| \n", + " | id | \n", + "split | \n", + "
|---|---|---|
| 0 | \n", + "1 | \n", + "train | \n", + "
| 1 | \n", + "3 | \n", + "train | \n", + "
| 2 | \n", + "4 | \n", + "train | \n", + "
| 3 | \n", + "6 | \n", + "train | \n", + "
| 4 | \n", + "9 | \n", + "train | \n", + "