Dataset Viewer
Auto-converted to Parquet Duplicate
chain_uid
stringlengths
6
8
pdb_id
stringlengths
4
4
label_asym_id
stringlengths
1
3
auth_asym_id
stringlengths
1
4
entity_id
stringclasses
165 values
seqs
stringlengths
2
8.57k
sequence_hash
stringlengths
28
28
assembly_ids
listlengths
1
11
method
stringclasses
10 values
resolution
float64
0.48
70
release_date
stringdate
1976-05-19 00:00:00
2026-06-24 00:00:00
observed_ca_fraction
float64
0
1
standard_aa_fraction
float64
0
1
quality_tier
stringclasses
3 values
sequence_cluster_30
stringlengths
28
28
structure_cluster
stringlengths
23
23
split_component
stringlengths
26
26
split
stringclasses
1 value
member_count
int64
1
2.58k
representative_chain_id
stringlengths
6
8
7dvd_E
7dvd
E
E
2
EIGAQLRRMADDLNA
seq_49f56b636a9463f8200600e1
[ "5" ]
X-RAY DIFFRACTION
2.59
2021-08-04
1
1
low_quality
seq_49f56b636a9463f8200600e1
struct_def5dbf48fc302c7
component_3f8b289bd5ed90ed
train
1
7dvd_E
8gjs_B
8gjs
B
B
2
XLTFXEYWAQLLAAAAAA
seq_2972d14d2f2affdb3144697f
[ "2" ]
X-RAY DIFFRACTION
1.56
2023-07-26
0.777778
0.888889
low_quality
seq_2972d14d2f2affdb3144697f
struct_ccd94f698c695660
component_3f8b289bd5ed90ed
train
1
8gjs_B
4l67_B
4l67
B
B
2
PRQWQSLIEESARRPKPLVDPACIT
seq_8179aa95dfe8ad8bd08a0a39
[ "2" ]
X-RAY DIFFRACTION
2.8
2013-08-14
0.8
1
extended
seq_8179aa95dfe8ad8bd08a0a39
struct_840cb6d92eeb5ccf
component_3f8b289bd5ed90ed
train
1
4l67_B
2z5n_B
2z5n
B
B
2
YSNQQSGYGKVSRRGGHQNSYKPY
seq_9dc99e7323a4e28e2df0652f
[ "2" ]
X-RAY DIFFRACTION
3.2
2007-10-23
0.625
1
extended
seq_9dc99e7323a4e28e2df0652f
struct_ee0d809a4bdd95b3
component_3f8b289bd5ed90ed
train
1
2z5n_B
200l_A
200l
A
A
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMAQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_6642496e01888363cfbe50c9
[ "1" ]
X-RAY DIFFRACTION
1.95
1996-03-08
0.987805
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
4
200l_A
101m_A
101m
A
A
1
MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRVKHLKTEAEMKASEDLKKHGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG
seq_d252e12ea80505784e26ecbf
[ "1" ]
X-RAY DIFFRACTION
2.07
1998-04-08
1
1
core
seq_fb0ff316e972937b8152db3a
struct_e448a8132443a193
component_3f8b289bd5ed90ed
train
4
1mym_A
201l_A
201l
A
A
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKHPAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_0533b597b5311f6a56b83d92
[ "1" ]
X-RAY DIFFRACTION
2
1994-01-31
0.987952
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
2
201l_B
201l_B
201l
B
B
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKHPAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_0533b597b5311f6a56b83d92
[ "2" ]
X-RAY DIFFRACTION
2
1994-01-31
1
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
2
201l_B
102l_A
102l
A
A
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAAKSELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_ef78343c5b60c127a98f1d12
[ "1" ]
X-RAY DIFFRACTION
1.74
1993-10-31
0.987879
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
1
102l_A
102m_A
102m
A
A
1
MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKAGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG
seq_7762da8704b65f9798e48420
[ "1" ]
X-RAY DIFFRACTION
1.84
1998-04-08
1
1
core
seq_fb0ff316e972937b8152db3a
struct_e448a8132443a193
component_3f8b289bd5ed90ed
train
12
5ilm_A
103l_A
103l
A
A
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNSLDAAKSELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_93fee99256cf88732db6022f
[ "1" ]
X-RAY DIFFRACTION
1.9
1993-10-31
0.952096
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
1
103l_A
103m_A
103m
A
A
1
MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKAGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG
seq_7762da8704b65f9798e48420
[ "1" ]
X-RAY DIFFRACTION
2.07
1998-04-08
1
1
core
seq_fb0ff316e972937b8152db3a
struct_e448a8132443a193
component_3f8b289bd5ed90ed
train
12
5ilm_A
104l_A
104l
A
A
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSAAELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_29581997a20b78f493653784
[ "1" ]
X-RAY DIFFRACTION
2.8
1993-10-31
0.987952
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
2
104l_A
104l_B
104l
B
B
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSAAELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_29581997a20b78f493653784
[ "2" ]
X-RAY DIFFRACTION
2.8
1993-10-31
0.987952
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
2
104l_A
104m_A
104m
A
A
1
VLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGDFGADAQGAMNKALELFRKDIAAKYKELGYQG
seq_4e1e5bdd96abfd0c314159fd
[ "1" ]
X-RAY DIFFRACTION
1.71
1998-04-08
1
1
core
seq_fb0ff316e972937b8152db3a
struct_e448a8132443a193
component_3f8b289bd5ed90ed
train
82
2ekt_A
105m_A
105m
A
A
1
VLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGDFGADAQGAMNKALELFRKDIAAKYKELGYQG
seq_4e1e5bdd96abfd0c314159fd
[ "1" ]
X-RAY DIFFRACTION
2.02
1998-04-08
1
1
core
seq_fb0ff316e972937b8152db3a
struct_e448a8132443a193
component_3f8b289bd5ed90ed
train
82
2ekt_A
205l_A
205l
A
A
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSAAAELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_165b1a0fba32e47f2770d46d
[ "1" ]
X-RAY DIFFRACTION
2.1
1994-01-31
0.952096
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
1
205l_A
106m_A
106m
A
A
1
MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTFLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG
seq_efeee66808c25d1bd8c64d00
[ "1" ]
X-RAY DIFFRACTION
1.99
1998-04-08
1
1
core
seq_fb0ff316e972937b8152db3a
struct_e448a8132443a193
component_3f8b289bd5ed90ed
train
6
1mll_A
206l_A
206l
A
A
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNASKSELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_56f25cb14e837a305e73f7fa
[ "1" ]
X-RAY DIFFRACTION
1.75
1996-08-17
0.987805
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
1
206l_A
107l_A
107l
A
A
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKGELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_05bad0eeac35d610558735c1
[ "1" ]
X-RAY DIFFRACTION
1.8
1993-10-31
0.987805
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
1
107l_A
107m_A
107m
A
A
1
MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTFLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG
seq_efeee66808c25d1bd8c64d00
[ "1" ]
X-RAY DIFFRACTION
2.09
1998-04-08
1
1
core
seq_fb0ff316e972937b8152db3a
struct_e448a8132443a193
component_3f8b289bd5ed90ed
train
6
1mll_A
207l_A
207l
A
A
1
KVFERCELARTLKRLGMDGYRGISLANWMCLAKWESGYNTRATNYNAGDRSTDYGIFQINSRYWCNDGKTPGAVNAAHLSCSALLQDNIADAVACAKRVVRDPQGIRAWVAWRNRCQNRDVRQYVQGCGV
seq_0b1f7f2773d6dc1237cb7460
[ "1" ]
X-RAY DIFFRACTION
1.75
1996-10-14
1
1
core
seq_1b6af75dd3c91cecedd7194a
struct_af742d4f61faba4f
component_3f8b289bd5ed90ed
train
4
207l_A
108l_A
108l
A
A
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKIELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_381e137b01eb744dea5516de
[ "1" ]
X-RAY DIFFRACTION
1.8
1993-10-31
0.987805
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
1
108l_A
108m_A
108m
A
A
1
MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTFLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG
seq_efeee66808c25d1bd8c64d00
[ "1" ]
X-RAY DIFFRACTION
2.67
1998-05-20
1
1
core
seq_fb0ff316e972937b8152db3a
struct_e448a8132443a193
component_3f8b289bd5ed90ed
train
6
1mll_A
208l_A
208l
A
A
1
KVFERCELARTLKRLGMDGYRGISLANWMCLAKWESGYNTRATNYNAGDRSTDYGIFQINSRYWCNDGKTPGAVNAAHLSCSALLQDNIADAVACAKRVVRDPQGIRAWVAWRNRCQNRDVRQYVQGCGV
seq_0b1f7f2773d6dc1237cb7460
[ "1" ]
X-RAY DIFFRACTION
1.8
1996-10-14
1
1
core
seq_1b6af75dd3c91cecedd7194a
struct_af742d4f61faba4f
component_3f8b289bd5ed90ed
train
4
207l_A
109l_A
109l
A
A
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKKELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_26be00d0f75767c685201906
[ "1" ]
X-RAY DIFFRACTION
1.85
1993-10-31
0.987805
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
1
109l_A
109m_A
109m
A
A
1
MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG
seq_7068ee572ee196e373d3371a
[ "1" ]
X-RAY DIFFRACTION
1.83
1998-04-08
1
1
core
seq_fb0ff316e972937b8152db3a
struct_e448a8132443a193
component_3f8b289bd5ed90ed
train
26
1jw8_A
209d_C
209d
C
C
2
TVPGVXTVPGV
seq_f1490965ba1401b8776ff444
[ "1" ]
X-RAY DIFFRACTION
3
1995-10-15
0.363636
0.909091
low_quality
seq_f1490965ba1401b8776ff444
struct_8d2f10f4b300c5e6
component_3f8b289bd5ed90ed
train
59
1qfi_A
209l_A
209l
A
A
1
MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKAIGRNTNGVITKDEAEKLFNQDVDAAAAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL
seq_be5b777b7a3781b22a595b9d
[ "1" ]
X-RAY DIFFRACTION
2.7
1996-12-23
0.988024
1
core
seq_431e4645a02f8a5bc01ebc6b
struct_519869b66e394cbb
component_3f8b289bd5ed90ed
train
1
209l_A
10ad_A
10ad
A
E
1
MDALIIPVTMEVPCDSRGQRMWWAFLASSMVTFFGGLFIILLWRTLKYLWTVCCHCGGKTKEAQKINNGSSQADGTLKPVDEKEEAVAAEVGWMTSVKDWAGVMISAQTLTGRVLVVLVFALSIGALVIYFIDSSNPIESCQNFYKDFTLQIDMAFNVFFLLYFGLRFIAANDKLWFWLEVNSVVDFFTVPPVFVSVYLNRSWLGLRFLRALRLIQFSEILQFLNILKTSNSIKLVNLLSIFISTWLTAAGFIHLVENSGDPWENFQNNQALTYWECVYLLMVTMSTVGYGDVYAKTTLGRLFMVFFILGGLAMFASYVP...
seq_b48877120660dd28bb133cdd
[ "1" ]
ELECTRON MICROSCOPY
3.44
2026-02-04
0.785265
1
extended
seq_088fe509fecb2499d15f55d5
struct_ccfd713d07f16c59
component_3f8b289bd5ed90ed
train
4
10ad_A
10ad_B
10ad
B
C
1
MDALIIPVTMEVPCDSRGQRMWWAFLASSMVTFFGGLFIILLWRTLKYLWTVCCHCGGKTKEAQKINNGSSQADGTLKPVDEKEEAVAAEVGWMTSVKDWAGVMISAQTLTGRVLVVLVFALSIGALVIYFIDSSNPIESCQNFYKDFTLQIDMAFNVFFLLYFGLRFIAANDKLWFWLEVNSVVDFFTVPPVFVSVYLNRSWLGLRFLRALRLIQFSEILQFLNILKTSNSIKLVNLLSIFISTWLTAAGFIHLVENSGDPWENFQNNQALTYWECVYLLMVTMSTVGYGDVYAKTTLGRLFMVFFILGGLAMFASYVP...
seq_b48877120660dd28bb133cdd
[ "1" ]
ELECTRON MICROSCOPY
3.44
2026-02-04
0.785265
1
extended
seq_088fe509fecb2499d15f55d5
struct_ccfd713d07f16c59
component_3f8b289bd5ed90ed
train
4
10ad_A
10ad_C
10ad
C
D
1
MDALIIPVTMEVPCDSRGQRMWWAFLASSMVTFFGGLFIILLWRTLKYLWTVCCHCGGKTKEAQKINNGSSQADGTLKPVDEKEEAVAAEVGWMTSVKDWAGVMISAQTLTGRVLVVLVFALSIGALVIYFIDSSNPIESCQNFYKDFTLQIDMAFNVFFLLYFGLRFIAANDKLWFWLEVNSVVDFFTVPPVFVSVYLNRSWLGLRFLRALRLIQFSEILQFLNILKTSNSIKLVNLLSIFISTWLTAAGFIHLVENSGDPWENFQNNQALTYWECVYLLMVTMSTVGYGDVYAKTTLGRLFMVFFILGGLAMFASYVP...
seq_b48877120660dd28bb133cdd
[ "1" ]
ELECTRON MICROSCOPY
3.44
2026-02-04
0.785265
1
extended
seq_088fe509fecb2499d15f55d5
struct_ccfd713d07f16c59
component_3f8b289bd5ed90ed
train
4
10ad_A
10ad_D
10ad
D
A
1
MDALIIPVTMEVPCDSRGQRMWWAFLASSMVTFFGGLFIILLWRTLKYLWTVCCHCGGKTKEAQKINNGSSQADGTLKPVDEKEEAVAAEVGWMTSVKDWAGVMISAQTLTGRVLVVLVFALSIGALVIYFIDSSNPIESCQNFYKDFTLQIDMAFNVFFLLYFGLRFIAANDKLWFWLEVNSVVDFFTVPPVFVSVYLNRSWLGLRFLRALRLIQFSEILQFLNILKTSNSIKLVNLLSIFISTWLTAAGFIHLVENSGDPWENFQNNQALTYWECVYLLMVTMSTVGYGDVYAKTTLGRLFMVFFILGGLAMFASYVP...
seq_b48877120660dd28bb133cdd
[ "1" ]
ELECTRON MICROSCOPY
3.44
2026-02-04
0.785265
1
extended
seq_088fe509fecb2499d15f55d5
struct_ccfd713d07f16c59
component_3f8b289bd5ed90ed
train
4
10ad_A
10af_A
10af
A
A
1
MAHHHHHHMSRPHVFFDITIGGSNAGRIVMELFADIVPKTAENFRCLCTGERGMGRSGKKLHYKGSKFHRVIPNFMLQGGDFTRGNGTGGESIYGEKFPDENFQEKHTGPGVLSMANAGPNTNGSQFFICTAKTEWLDGKHVVFGRVVEGMNVVKAVESKGSQSGRTSADIVIADCGQL
seq_a1f700ab62fc9048d6c89952
[ "1" ]
X-RAY DIFFRACTION
1.25
2026-01-21
0.949721
1
core
seq_639d20e1b4c5fd1474620f19
struct_5c276d9f03a7be39
component_3f8b289bd5ed90ed
train
1
10af_A
10ah_A
10ah
A
A
1
SNAGGSSPITGLVYDQRMMLHHNMWDSHHPELPQRISRIFSRHEELRLLSRCHRIPARLATEEELALCHSSKHISIIKSSEHMKPRDLNRLGDEYDSIFISNESYTCALLAAGSCFNSAQAILTGQVRNAVAIVRPPGHHAEKDTACGFCFFNTAALTARYAQSITRESLRVLIVDWDVHHGNGTQHIFEEDDSVLYISLHRYEDGAFFPNSEDANYDKVGLGKGRGYNVNIPWNGGKMGDPEYMAAFHHLVMPIAREFAPELVLVSAGFDAARGDPLGGFQVTPEGYAHLTHQLMSLAAGRVLIILEGGYNLTSISESM...
seq_be307890dd23905f77cdfafa
[ "1" ]
X-RAY DIFFRACTION
2.2
2026-06-17
0.978022
1
core
seq_cfa6024209130a23601f5d2d
struct_1aaf3c4c36263840
component_3f8b289bd5ed90ed
train
4
10ai_A
10ah_B
10ah
B
B
1
SNAGGSSPITGLVYDQRMMLHHNMWDSHHPELPQRISRIFSRHEELRLLSRCHRIPARLATEEELALCHSSKHISIIKSSEHMKPRDLNRLGDEYDSIFISNESYTCALLAAGSCFNSAQAILTGQVRNAVAIVRPPGHHAEKDTACGFCFFNTAALTARYAQSITRESLRVLIVDWDVHHGNGTQHIFEEDDSVLYISLHRYEDGAFFPNSEDANYDKVGLGKGRGYNVNIPWNGGKMGDPEYMAAFHHLVMPIAREFAPELVLVSAGFDAARGDPLGGFQVTPEGYAHLTHQLMSLAAGRVLIILEGGYNLTSISESM...
seq_be307890dd23905f77cdfafa
[ "2" ]
X-RAY DIFFRACTION
2.2
2026-06-17
0.978022
1
core
seq_cfa6024209130a23601f5d2d
struct_1aaf3c4c36263840
component_3f8b289bd5ed90ed
train
4
10ai_A
10ai_A
10ai
A
A
1
SNAGGSSPITGLVYDQRMMLHHNMWDSHHPELPQRISRIFSRHEELRLLSRCHRIPARLATEEELALCHSSKHISIIKSSEHMKPRDLNRLGDEYDSIFISNESYTCALLAAGSCFNSAQAILTGQVRNAVAIVRPPGHHAEKDTACGFCFFNTAALTARYAQSITRESLRVLIVDWDVHHGNGTQHIFEEDDSVLYISLHRYEDGAFFPNSEDANYDKVGLGKGRGYNVNIPWNGGKMGDPEYMAAFHHLVMPIAREFAPELVLVSAGFDAARGDPLGGFQVTPEGYAHLTHQLMSLAAGRVLIILEGGYNLTSISESM...
seq_be307890dd23905f77cdfafa
[ "1" ]
X-RAY DIFFRACTION
2.1
2026-06-17
0.978022
1
core
seq_cfa6024209130a23601f5d2d
struct_1aaf3c4c36263840
component_3f8b289bd5ed90ed
train
4
10ai_A
10ai_B
10ai
B
B
1
SNAGGSSPITGLVYDQRMMLHHNMWDSHHPELPQRISRIFSRHEELRLLSRCHRIPARLATEEELALCHSSKHISIIKSSEHMKPRDLNRLGDEYDSIFISNESYTCALLAAGSCFNSAQAILTGQVRNAVAIVRPPGHHAEKDTACGFCFFNTAALTARYAQSITRESLRVLIVDWDVHHGNGTQHIFEEDDSVLYISLHRYEDGAFFPNSEDANYDKVGLGKGRGYNVNIPWNGGKMGDPEYMAAFHHLVMPIAREFAPELVLVSAGFDAARGDPLGGFQVTPEGYAHLTHQLMSLAAGRVLIILEGGYNLTSISESM...
seq_be307890dd23905f77cdfafa
[ "2" ]
X-RAY DIFFRACTION
2.1
2026-06-17
0.978022
1
core
seq_cfa6024209130a23601f5d2d
struct_1aaf3c4c36263840
component_3f8b289bd5ed90ed
train
4
10ai_A
10aj_A
10aj
A
A
1
EGEEDDDKDFLWPAPNEEQVTCLKMYFGHSSFKPVQWKVIHSVLEERRDNVAVMATGYGKSLCFQYPPVYVGKIGLVISPLISLMEDQVLQLKMSNIPACFLGSAQSENVLTDIKLGKYRIVYVTPEYCSGNMGLLQQLEADIGITLIAVDEAHCISEWGHDFRDSFRKLGSLKTALPMVPIVALTATASSSIREDIVRCLNLRNPQITCTGFDRPNLYLEVRRKTGNILQDLQPFLVKTSSHWEFEGPTIIYCPSRKMTQQVTGELRKLNLSCGTYHAGMSFSTRKDIHHRFVRDEIQCVIATIAFGMGINKADIRQVI...
seq_969b6ab0389096c0ca7d14c4
[ "1" ]
X-RAY DIFFRACTION
2.42
2026-05-13
0.981352
1
core
seq_6b5dc3d2f02938658e1ad124
struct_7c2bc6b12135584b
component_3f8b289bd5ed90ed
train
1
10aj_A
10ak_A
10ak
A
A
1
ANEGEEDDDKDFLWPAPNEEQVTCLKMYFGHSSFKPVQWKVIHSVLEERRDNVAVMATGYGKSLCFQYPPVYVGKIGLVISPLISLMEDQVLQLKMSNIPACFLGSAQSENVLTDIKLGKYRIVYVTPEYCSGNMGLLQQLEADIGITLIAVDEAHCISEWGHDFRDSFRKLGSLKTALPMVPIVALTATASSSIREDIVRCLNLRNPQITCTGFDRPNLYLEVRRKTGNILQDLQPFLVKTSSHWEFEGPTIIYCPSRKMTQQVTGELRKLNLSCGTYHAGMSFSTRKDIHHRFVRDEIQCVIATIAFGMGINKADIRQ...
seq_e98bb0f99dbe86d18f6abe12
[ "1" ]
X-RAY DIFFRACTION
1.368
2026-05-13
0.981439
1
core
seq_6b5dc3d2f02938658e1ad124
struct_7c2bc6b12135584b
component_3f8b289bd5ed90ed
train
1
10ak_A
10ap_A
10ap
A
A
1
NLGLPTKEEEEDDENEANEGEEDDDKDFLWPAPNEEQVTCLKMYFGHSSFKPVQWKVIHSVLEERRDNVAVMATGYGKSLCFQYPPVYVGKIGLVISPLISLMEDQVLQLKMSNIPACFLGSAQSENVLTDIKLGKYRIVYVTPEYCSGNMGLLQQLEADIGITLIAVDEAHCISEWGHDFRDSFRKLGSLKTALPMVPIVALTATASSSIREDIVRCLNLRNPQITCTGFDRPNLYLEVRRKTGNILQDLQPFLVKTSSHWEFEGPTIIYCPSRKMTQQVTGELRKLNLSCGTYHAGMSFSTRKDIHHRFVRDEIQCVI...
seq_25ac36d46f06caa0a785c928
[ "1" ]
X-RAY DIFFRACTION
2.58
2026-05-13
0.941834
1
core
seq_6b5dc3d2f02938658e1ad124
struct_7c2bc6b12135584b
component_3f8b289bd5ed90ed
train
1
10ap_A
10ay_A
10ay
A
A
1
GKPPQRSIDKPFRLCVSDVFKDQGSGFCITGKIEAGYIQTGDRLLAMPPNETCTVKGITLHDEPVDWAAAGDHVSLTLVGMDIIKINVGCIFCGPKVPIKACTRFRARILIFNIEIPITKGFPVLLHYQTVSEPAVIKRLISVLNKSTGEVTKKKPKFLTKGQNALVELQTQRPIALELYKDFKELGRFMLRYGGSTIAAGVVTEIKE
seq_caa15a978f7aecfe1173252e
[ "1" ]
ELECTRON MICROSCOPY
2.9
2026-04-22
0.480769
1
low_quality
seq_2a3a0c3d94c6dfb72d13aa27
struct_4b2f87d2128982a9
component_3f8b289bd5ed90ed
train
4
11mr_A
10ay_B
10ay
B
B
2
GEAKKPNIINFDTSLPTSHTYLGADMEEFHGRTLHDDDSCQVIPVLPQVMMILIPGQTLPLQLFHPQEVSMVRNLIQKDRTFAVLAYSNVQEREAQFGTTAEIYAYREEQDFGIEIVKVKAIGRQRFKVLELRTQSDGIQQAKVQILPECVLPSTMSAVQLESLNKCQIFPSKPVSREDQCSYKWWQKYQKRKFHCANLTSWPRWLYSLYDAETLMDRIKKQLREWDENLKDDSLPSNPIDFSYRVAACLPIDDVLRIQLLKIGSAIQRLRCELDIMNKCTSLCCKQCQETEITTKNEIFSLSLCGPMAAYVNPHGYVHE...
seq_37b13dc80e4e5a333356c5b3
[ "1" ]
ELECTRON MICROSCOPY
2.9
2026-04-22
0.943069
1
core
seq_c3f3cae45b879e67d691f7f2
struct_0662d7fab350333a
component_3f8b289bd5ed90ed
train
4
11mr_B
10ay_C
10ay
C
C
3
MSYNYVVTAQKPTAVNGCVTGHFTSAEDLNLLIAKNTRLEIYVVTAEGLRPVKEVGMYGKIAVMELFRPKGESKDLLFILTAKYNACILEYKQSGESIDIITRAHGNVQDRIGRPSETGIIGIIDPECRMIGLRLYDGLFKVIPLDRDNKELKAFNIRLEELHVIDVKFLYGCQAPTICFVYQDPQGRHVKTYEVSLREKEFNKGPWKQENVEAEASMVIAVPEPFGGAIIIGQESITYHNGDKYLAIAPPIIKQSTIVCHNRVDPNGSRYLLGDMEGRLFMLLLEKEEQMDGTVTLKDLRVELLGETSIAECLTYLDNG...
seq_80be356aef4f71329822694d
[ "1" ]
ELECTRON MICROSCOPY
2.9
2026-04-22
0.687719
1
extended
seq_0b1744cbd74dc2a14a5c400a
struct_a8a537e9c54fb73b
component_3f8b289bd5ed90ed
train
75
3e0c_A
10ay_D
10ay
D
D
1
GKPPQRSIDKPFRLCVSDVFKDQGSGFCITGKIEAGYIQTGDRLLAMPPNETCTVKGITLHDEPVDWAAAGDHVSLTLVGMDIIKINVGCIFCGPKVPIKACTRFRARILIFNIEIPITKGFPVLLHYQTVSEPAVIKRLISVLNKSTGEVTKKKPKFLTKGQNALVELQTQRPIALELYKDFKELGRFMLRYGGSTIAAGVVTEIKE
seq_caa15a978f7aecfe1173252e
[ "1" ]
ELECTRON MICROSCOPY
2.9
2026-04-22
0.461538
1
low_quality
seq_2a3a0c3d94c6dfb72d13aa27
struct_4b2f87d2128982a9
component_3f8b289bd5ed90ed
train
4
11mr_A
10ay_E
10ay
E
E
2
GEAKKPNIINFDTSLPTSHTYLGADMEEFHGRTLHDDDSCQVIPVLPQVMMILIPGQTLPLQLFHPQEVSMVRNLIQKDRTFAVLAYSNVQEREAQFGTTAEIYAYREEQDFGIEIVKVKAIGRQRFKVLELRTQSDGIQQAKVQILPECVLPSTMSAVQLESLNKCQIFPSKPVSREDQCSYKWWQKYQKRKFHCANLTSWPRWLYSLYDAETLMDRIKKQLREWDENLKDDSLPSNPIDFSYRVAACLPIDDVLRIQLLKIGSAIQRLRCELDIMNKCTSLCCKQCQETEITTKNEIFSLSLCGPMAAYVNPHGYVHE...
seq_37b13dc80e4e5a333356c5b3
[ "1" ]
ELECTRON MICROSCOPY
2.9
2026-04-22
0.943069
1
core
seq_c3f3cae45b879e67d691f7f2
struct_0662d7fab350333a
component_3f8b289bd5ed90ed
train
4
11mr_B
10ay_F
10ay
F
F
3
MSYNYVVTAQKPTAVNGCVTGHFTSAEDLNLLIAKNTRLEIYVVTAEGLRPVKEVGMYGKIAVMELFRPKGESKDLLFILTAKYNACILEYKQSGESIDIITRAHGNVQDRIGRPSETGIIGIIDPECRMIGLRLYDGLFKVIPLDRDNKELKAFNIRLEELHVIDVKFLYGCQAPTICFVYQDPQGRHVKTYEVSLREKEFNKGPWKQENVEAEASMVIAVPEPFGGAIIIGQESITYHNGDKYLAIAPPIIKQSTIVCHNRVDPNGSRYLLGDMEGRLFMLLLEKEEQMDGTVTLKDLRVELLGETSIAECLTYLDNG...
seq_80be356aef4f71329822694d
[ "1" ]
ELECTRON MICROSCOPY
2.9
2026-04-22
0.685965
1
extended
seq_0b1744cbd74dc2a14a5c400a
struct_a8a537e9c54fb73b
component_3f8b289bd5ed90ed
train
75
3e0c_A
10be_C
10be
C
A
3
GAMGSMDYKDDDDKMYSGAGPALAPPAPPPPIQGYAFKPPPRPDFGTSGRTIKLQANFFEMDIPKIDIYHYELDIKPEKCPRRVNREIVEHMVQHFKTQIFGDRKPVFDGRKNLYTAMPLPIGRDKVELEVTLPGEGKDRIFKVSIKWVSCVSLQALHDALSGRLPSVPFETIQALDVVMRHLPSMRYTPVGRSFFTASEGCSNPLGGGREVWFGFHQSVRPSLWKMMLNIDVSATAFYKAQPVIEFVCEVLDFKSIEEQQKPLTDSQRVKFTKEIKGLKVEITHCGQMKRKYRVCNVTRRPASHQTFPLQQESGQTVEC...
seq_96fd5a59357343cf7a22afc0
[ "1" ]
ELECTRON MICROSCOPY
3.02
2026-06-03
0.907216
1
core
seq_4bd5ef67c7a40efa13266d24
struct_fb89371558e09729
component_3f8b289bd5ed90ed
train
1
10be_C
10bl_A
10bl
A
A
1
MEKVTKDDFESLDVLGKGSFAYVVLVRRIGTNEYYAMKVVNKQGLLDHNRYRDVFVERNVLSRINHPYLLKLYWTFQSEHKLFFVMEYMPGGDLDKYMNNLPSKQFDLFTAKLYAAEILLALLFLHEHSVIYRDLKPENILLTGDGHCVLADFGLSKDFYNPKEGGDASTKDMRANSFVGSPFYVAPDVLKQSEYTNAVDFWSFGILLYRMLCGRTPFNGKSMREVFDNILYSDLRFPSSVQLPSEAKDLISRLLIKDANRRIKGPEIKAHLFWTGINFDEVMERKVKPPKWVPIPSPEQVMAERAKAEGASTSAKNPGQ...
seq_ce9fe9a75ebf0fd5af718434
[ "1" ]
X-RAY DIFFRACTION
2.6
2026-01-21
0.925208
1
core
seq_c2e80c6e24279dcc21792c38
struct_bbe510513bfc4bc5
component_3f8b289bd5ed90ed
train
10
10bl_A
10bl_B
10bl
B
B
1
MEKVTKDDFESLDVLGKGSFAYVVLVRRIGTNEYYAMKVVNKQGLLDHNRYRDVFVERNVLSRINHPYLLKLYWTFQSEHKLFFVMEYMPGGDLDKYMNNLPSKQFDLFTAKLYAAEILLALLFLHEHSVIYRDLKPENILLTGDGHCVLADFGLSKDFYNPKEGGDASTKDMRANSFVGSPFYVAPDVLKQSEYTNAVDFWSFGILLYRMLCGRTPFNGKSMREVFDNILYSDLRFPSSVQLPSEAKDLISRLLIKDANRRIKGPEIKAHLFWTGINFDEVMERKVKPPKWVPIPSPEQVMAERAKAEGASTSAKNPGQ...
seq_ce9fe9a75ebf0fd5af718434
[ "1" ]
X-RAY DIFFRACTION
2.6
2026-01-21
0.894737
1
core
seq_c2e80c6e24279dcc21792c38
struct_bbe510513bfc4bc5
component_3f8b289bd5ed90ed
train
10
10bl_A
10bm_A
10bm
A
A
1
MAHHHHHHSPILPGAWLGMVGGGQLGRMFCFAAQAMGYRVAVLDPDENSPAGAVADRHLRAAYNDEASLTELARLCAAVSTEFENVPAASLDFLARTTFVSPAGRCVAVAQDRIAEKRFIASSGVTVAPHVVIESSDALAALDDAKLEAVLPGILKTARMGYDGKGQIRVRNAEEVREAHASLAGVPCVLEKRLPLKFEVSALIARAASGASVVYPLAQNTHRDGVLSHTIVPAPDASPTLVQQAQQAALQIADKLGYVGVLCVEFFILEDGSLVANEMAPRPHNSGHYTVDACATSQFEQQVRAMTGMPLGDTRQHSPA...
seq_cddf9cb4fec978452f2d8fd7
[ "1" ]
X-RAY DIFFRACTION
2.49
2026-01-21
0.97733
1
core
seq_3bcb3f500f24a67384287a21
struct_f42856f5e6985860
component_3f8b289bd5ed90ed
train
18
9zoi_A
10bm_B
10bm
B
B
1
MAHHHHHHSPILPGAWLGMVGGGQLGRMFCFAAQAMGYRVAVLDPDENSPAGAVADRHLRAAYNDEASLTELARLCAAVSTEFENVPAASLDFLARTTFVSPAGRCVAVAQDRIAEKRFIASSGVTVAPHVVIESSDALAALDDAKLEAVLPGILKTARMGYDGKGQIRVRNAEEVREAHASLAGVPCVLEKRLPLKFEVSALIARAASGASVVYPLAQNTHRDGVLSHTIVPAPDASPTLVQQAQQAALQIADKLGYVGVLCVEFFILEDGSLVANEMAPRPHNSGHYTVDACATSQFEQQVRAMTGMPLGDTRQHSPA...
seq_cddf9cb4fec978452f2d8fd7
[ "2" ]
X-RAY DIFFRACTION
2.49
2026-01-21
0.964736
1
core
seq_3bcb3f500f24a67384287a21
struct_f42856f5e6985860
component_3f8b289bd5ed90ed
train
18
9zoi_A
10bm_C
10bm
C
C
1
MAHHHHHHSPILPGAWLGMVGGGQLGRMFCFAAQAMGYRVAVLDPDENSPAGAVADRHLRAAYNDEASLTELARLCAAVSTEFENVPAASLDFLARTTFVSPAGRCVAVAQDRIAEKRFIASSGVTVAPHVVIESSDALAALDDAKLEAVLPGILKTARMGYDGKGQIRVRNAEEVREAHASLAGVPCVLEKRLPLKFEVSALIARAASGASVVYPLAQNTHRDGVLSHTIVPAPDASPTLVQQAQQAALQIADKLGYVGVLCVEFFILEDGSLVANEMAPRPHNSGHYTVDACATSQFEQQVRAMTGMPLGDTRQHSPA...
seq_cddf9cb4fec978452f2d8fd7
[ "3" ]
X-RAY DIFFRACTION
2.49
2026-01-21
0.979849
1
core
seq_3bcb3f500f24a67384287a21
struct_f42856f5e6985860
component_3f8b289bd5ed90ed
train
18
9zoi_A
10bm_D
10bm
D
D
1
MAHHHHHHSPILPGAWLGMVGGGQLGRMFCFAAQAMGYRVAVLDPDENSPAGAVADRHLRAAYNDEASLTELARLCAAVSTEFENVPAASLDFLARTTFVSPAGRCVAVAQDRIAEKRFIASSGVTVAPHVVIESSDALAALDDAKLEAVLPGILKTARMGYDGKGQIRVRNAEEVREAHASLAGVPCVLEKRLPLKFEVSALIARAASGASVVYPLAQNTHRDGVLSHTIVPAPDASPTLVQQAQQAALQIADKLGYVGVLCVEFFILEDGSLVANEMAPRPHNSGHYTVDACATSQFEQQVRAMTGMPLGDTRQHSPA...
seq_cddf9cb4fec978452f2d8fd7
[ "4" ]
X-RAY DIFFRACTION
2.49
2026-01-21
0.967254
1
core
seq_3bcb3f500f24a67384287a21
struct_f42856f5e6985860
component_3f8b289bd5ed90ed
train
18
9zoi_A
10br_A
10br
A
A
1
GPLGSIESAWLGISFYPLKTRDSEVLKSLGVESNDVSAAIIASLYPGSPAVKSGLRAGDIIMKVNGVSMSVFQDVTSYISDFYAGEKVNVEILRGNVKKNIEIVLAVRPKDKELSSSKMLPGFVVYPLVEDIKAQLNLRNWIKGVVVDYIDKNLASNIKMKSGDVILSVNSKSVSNLREFYDALEVGKNTYKILRGNDSFKITF
seq_86769b4f7e15dccaa1580cc4
[ "1" ]
X-RAY DIFFRACTION
1.5
2026-06-17
1
1
core
seq_86769b4f7e15dccaa1580cc4
struct_905e0881dd84d01e
component_56c9ada516b64618
train
4
10br_A
10br_B
10br
B
B
1
GPLGSIESAWLGISFYPLKTRDSEVLKSLGVESNDVSAAIIASLYPGSPAVKSGLRAGDIIMKVNGVSMSVFQDVTSYISDFYAGEKVNVEILRGNVKKNIEIVLAVRPKDKELSSSKMLPGFVVYPLVEDIKAQLNLRNWIKGVVVDYIDKNLASNIKMKSGDVILSVNSKSVSNLREFYDALEVGKNTYKILRGNDSFKITF
seq_86769b4f7e15dccaa1580cc4
[ "1" ]
X-RAY DIFFRACTION
1.5
2026-06-17
0.97549
1
core
seq_86769b4f7e15dccaa1580cc4
struct_905e0881dd84d01e
component_56c9ada516b64618
train
4
10br_A
10br_C
10br
C
C
1
GPLGSIESAWLGISFYPLKTRDSEVLKSLGVESNDVSAAIIASLYPGSPAVKSGLRAGDIIMKVNGVSMSVFQDVTSYISDFYAGEKVNVEILRGNVKKNIEIVLAVRPKDKELSSSKMLPGFVVYPLVEDIKAQLNLRNWIKGVVVDYIDKNLASNIKMKSGDVILSVNSKSVSNLREFYDALEVGKNTYKILRGNDSFKITF
seq_86769b4f7e15dccaa1580cc4
[ "2" ]
X-RAY DIFFRACTION
1.5
2026-06-17
0.97549
1
core
seq_86769b4f7e15dccaa1580cc4
struct_905e0881dd84d01e
component_56c9ada516b64618
train
4
10br_A
10br_D
10br
D
D
1
GPLGSIESAWLGISFYPLKTRDSEVLKSLGVESNDVSAAIIASLYPGSPAVKSGLRAGDIIMKVNGVSMSVFQDVTSYISDFYAGEKVNVEILRGNVKKNIEIVLAVRPKDKELSSSKMLPGFVVYPLVEDIKAQLNLRNWIKGVVVDYIDKNLASNIKMKSGDVILSVNSKSVSNLREFYDALEVGKNTYKILRGNDSFKITF
seq_86769b4f7e15dccaa1580cc4
[ "2" ]
X-RAY DIFFRACTION
1.5
2026-06-17
1
1
core
seq_86769b4f7e15dccaa1580cc4
struct_905e0881dd84d01e
component_56c9ada516b64618
train
4
10br_A
10bt_A
10bt
A
A
1
EVKLEESGGGLVQPGGSMRLSCVASGFTFSNYWMNWVRQSPEKGLEWVAEIRLKSNNYATHYAESVKGRFTISRDDSTSSGYLQMNNLRTEDTGIHYCTLTLITDYDVMEYWGQGTSVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSCDKTHHHHHH
seq_52a0661b7733bda7e68395ad
[ "1" ]
X-RAY DIFFRACTION
1.99
2026-06-10
0.952991
1
core
seq_18e826e63cb5b287c0599278
struct_277beb1d82fc6a91
component_3f8b289bd5ed90ed
train
4
10bt_A
10bt_B
10bt
B
B
1
EVKLEESGGGLVQPGGSMRLSCVASGFTFSNYWMNWVRQSPEKGLEWVAEIRLKSNNYATHYAESVKGRFTISRDDSTSSGYLQMNNLRTEDTGIHYCTLTLITDYDVMEYWGQGTSVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSCDKTHHHHHH
seq_52a0661b7733bda7e68395ad
[ "2" ]
X-RAY DIFFRACTION
1.99
2026-06-10
0.940171
1
core
seq_18e826e63cb5b287c0599278
struct_f1cc39e7021627f2
component_3f8b289bd5ed90ed
train
4
10bt_A
10bt_C
10bt
C
C
1
EVKLEESGGGLVQPGGSMRLSCVASGFTFSNYWMNWVRQSPEKGLEWVAEIRLKSNNYATHYAESVKGRFTISRDDSTSSGYLQMNNLRTEDTGIHYCTLTLITDYDVMEYWGQGTSVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSCDKTHHHHHH
seq_52a0661b7733bda7e68395ad
[ "3" ]
X-RAY DIFFRACTION
1.99
2026-06-10
0.91453
1
core
seq_18e826e63cb5b287c0599278
struct_277beb1d82fc6a91
component_3f8b289bd5ed90ed
train
4
10bt_A
10bt_D
10bt
D
D
1
EVKLEESGGGLVQPGGSMRLSCVASGFTFSNYWMNWVRQSPEKGLEWVAEIRLKSNNYATHYAESVKGRFTISRDDSTSSGYLQMNNLRTEDTGIHYCTLTLITDYDVMEYWGQGTSVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSCDKTHHHHHH
seq_52a0661b7733bda7e68395ad
[ "4" ]
X-RAY DIFFRACTION
1.99
2026-06-10
0.940171
1
core
seq_18e826e63cb5b287c0599278
struct_277beb1d82fc6a91
component_3f8b289bd5ed90ed
train
4
10bt_A
10bt_E
10bt
E
E
2
DIQMTQSPSSLSASLGGKVTITCKANQDINKYIAWYQHKPGQGPRLLIHYASALQPGIPSRFSGSGSGRDYSFSISNLEPEDIATYYCLQYDNLYTFGGGTKLEIKRARTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC
seq_157d00c820376fd723c3d257
[ "1" ]
X-RAY DIFFRACTION
1.99
2026-06-10
1
1
core
seq_67bd7e2cba6e8d057f61d4fb
struct_69c04d1a82b73f90
component_3f8b289bd5ed90ed
train
4
10bt_E
10bt_F
10bt
F
F
2
DIQMTQSPSSLSASLGGKVTITCKANQDINKYIAWYQHKPGQGPRLLIHYASALQPGIPSRFSGSGSGRDYSFSISNLEPEDIATYYCLQYDNLYTFGGGTKLEIKRARTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC
seq_157d00c820376fd723c3d257
[ "2" ]
X-RAY DIFFRACTION
1.99
2026-06-10
1
1
core
seq_67bd7e2cba6e8d057f61d4fb
struct_69c04d1a82b73f90
component_3f8b289bd5ed90ed
train
4
10bt_E
10bt_G
10bt
G
G
2
DIQMTQSPSSLSASLGGKVTITCKANQDINKYIAWYQHKPGQGPRLLIHYASALQPGIPSRFSGSGSGRDYSFSISNLEPEDIATYYCLQYDNLYTFGGGTKLEIKRARTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC
seq_157d00c820376fd723c3d257
[ "3" ]
X-RAY DIFFRACTION
1.99
2026-06-10
1
1
core
seq_67bd7e2cba6e8d057f61d4fb
struct_69c04d1a82b73f90
component_3f8b289bd5ed90ed
train
4
10bt_E
10bt_H
10bt
H
H
2
DIQMTQSPSSLSASLGGKVTITCKANQDINKYIAWYQHKPGQGPRLLIHYASALQPGIPSRFSGSGSGRDYSFSISNLEPEDIATYYCLQYDNLYTFGGGTKLEIKRARTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC
seq_157d00c820376fd723c3d257
[ "4" ]
X-RAY DIFFRACTION
1.99
2026-06-10
1
1
core
seq_67bd7e2cba6e8d057f61d4fb
struct_69c04d1a82b73f90
component_3f8b289bd5ed90ed
train
4
10bt_E
10bu_A
10bu
A
A
1
MMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSTGEIPAPLAGTVSKILVKEGDTVKAGQTVLVLEAMKMETEINAPTDGKVEKVLVKERDAVQGGQGLIKIGGGTP...
seq_9f36cbab56bf103bcb6f152d
[ "1" ]
ELECTRON MICROSCOPY
3.2
2026-05-27
0.998991
1
core
seq_b360e235ec9237254a4dc51a
struct_f23e1e64a56e6400
component_3f8b289bd5ed90ed
train
3
10bu_A
10bu_B
10bu
B
B
1
MMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSTGEIPAPLAGTVSKILVKEGDTVKAGQTVLVLEAMKMETEINAPTDGKVEKVLVKERDAVQGGQGLIKIGGGTP...
seq_9f36cbab56bf103bcb6f152d
[ "1" ]
ELECTRON MICROSCOPY
3.2
2026-05-27
0.998991
1
core
seq_b360e235ec9237254a4dc51a
struct_f23e1e64a56e6400
component_3f8b289bd5ed90ed
train
3
10bu_A
10bu_C
10bu
C
C
1
MMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSTGEIPAPLAGTVSKILVKEGDTVKAGQTVLVLEAMKMETEINAPTDGKVEKVLVKERDAVQGGQGLIKIGGGTP...
seq_9f36cbab56bf103bcb6f152d
[ "1" ]
ELECTRON MICROSCOPY
3.2
2026-05-27
0.995964
1
core
seq_b360e235ec9237254a4dc51a
struct_f23e1e64a56e6400
component_3f8b289bd5ed90ed
train
3
10bu_A
30bt_A
30bt
A
A
1
MIAAPLVRVTLAYICGLLLASRITVGPVQLLALTVILWTLAYLFRQPPRRAAWQAFLLAGFMALGLLISTWDSSHHQSRLTGDRGTFLDLSGTVIEEPRVYANRVVYTLATREIRQGDYHKRVKEKVQVVLYRPAEGGEPELYRYGDVLRVHGQLAAPPAARNPGELDYRAYLARQYIYNRMLINDPRAIVKLGTVPGHPLVRLALGAKARVKTVITAALPPRQAGILAALLFGDVNELTDTDSDTFKNLGVFHFFAVSGSNTALVLLILMAIAGFLGLERSGAVFLGLAGLIFYAAVTGFTPSVSRAGIMAGLGLIAYL...
seq_52af76c97b47f395dd15cf86
[ "1" ]
ELECTRON MICROSCOPY
4.2
2026-05-20
0.340824
1
low_quality
seq_52af76c97b47f395dd15cf86
struct_5f54bba25646e9a1
component_3f8b289bd5ed90ed
train
3
30bu_A
30bu_A
30bu
A
A
1
MIAAPLVRVTLAYICGLLLASRITVGPVQLLALTVILWTLAYLFRQPPRRAAWQAFLLAGFMALGLLISTWDSSHHQSRLTGDRGTFLDLSGTVIEEPRVYANRVVYTLATREIRQGDYHKRVKEKVQVVLYRPAEGGEPELYRYGDVLRVHGQLAAPPAARNPGELDYRAYLARQYIYNRMLINDPRAIVKLGTVPGHPLVRLALGAKARVKTVITAALPPRQAGILAALLFGDVNELTDTDSDTFKNLGVFHFFAVSGSNTALVLLILMAIAGFLGLERSGAVFLGLAGLIFYAAVTGFTPSVSRAGIMAGLGLIAYL...
seq_52af76c97b47f395dd15cf86
[ "1" ]
ELECTRON MICROSCOPY
4.1
2026-05-20
0.659176
1
extended
seq_52af76c97b47f395dd15cf86
struct_83ec445fdf12ee88
component_3f8b289bd5ed90ed
train
3
30bu_A
30bu_B
30bu
B
B
1
MIAAPLVRVTLAYICGLLLASRITVGPVQLLALTVILWTLAYLFRQPPRRAAWQAFLLAGFMALGLLISTWDSSHHQSRLTGDRGTFLDLSGTVIEEPRVYANRVVYTLATREIRQGDYHKRVKEKVQVVLYRPAEGGEPELYRYGDVLRVHGQLAAPPAARNPGELDYRAYLARQYIYNRMLINDPRAIVKLGTVPGHPLVRLALGAKARVKTVITAALPPRQAGILAALLFGDVNELTDTDSDTFKNLGVFHFFAVSGSNTALVLLILMAIAGFLGLERSGAVFLGLAGLIFYAAVTGFTPSVSRAGIMAGLGLIAYL...
seq_52af76c97b47f395dd15cf86
[ "1" ]
ELECTRON MICROSCOPY
4.1
2026-05-20
0.619226
1
extended
seq_52af76c97b47f395dd15cf86
struct_83ec445fdf12ee88
component_3f8b289bd5ed90ed
train
3
30bu_A
10dc_A
10dc
A
A
1
MTEYKLVVVGAGGVGKSALTIQLIQNHFVDEYDPTIEDSYRKQVVIDGETCLLDILDTAGQEEYSAMADQYMRTGEGFLCVFAINNTKSFEDIHQYREQIKRVKDSDDVPMVLVGNKCDLAARTVESRQAQDLARSYGIPYIETSAKTRQGVEDAFYTLVREIRQH
seq_04fdee737523926977ff5491
[ "1" ]
X-RAY DIFFRACTION
2.08
2026-02-11
0.975904
1
core
seq_747ca141edd1a6d25946ca51
struct_04fe40d84ea9653a
component_3f8b289bd5ed90ed
train
1
10dc_A
10dj_A
10dj
A
A
1
VWEIPRESLQLIKRLGNGQFGEVWMGTWNGNTKVAIKTLKPGTMSPESFLEEAQIMKKLKHDKLVQLYAVVSEEPIYIVTEYMNKGSLLDFLKDGEGRALKLPNLVDMAAQVAAGMAYIERMNYIHRDLRSANILVGNGLICKIADFGLARLIEDNEYTARQGAKFPIKWTAPEAALYGRFTIKSDVWSFGILLTELVTKGRVPYPGMNNREVLEQVERGYRMPCPQDCPISLHELMIHCWKKDPEERPTFEYLQSFLEDYFTATEPQYQPGENLVDENLYF
seq_925babf455e1a2da5207ed61
[ "1" ]
X-RAY DIFFRACTION
2.22
2026-03-18
0.953901
1
core
seq_49d757fa60ff99b0d2bc2a03
struct_d38926c0a86ec433
component_3f8b289bd5ed90ed
train
2
10dj_B
10dj_B
10dj
B
B
1
VWEIPRESLQLIKRLGNGQFGEVWMGTWNGNTKVAIKTLKPGTMSPESFLEEAQIMKKLKHDKLVQLYAVVSEEPIYIVTEYMNKGSLLDFLKDGEGRALKLPNLVDMAAQVAAGMAYIERMNYIHRDLRSANILVGNGLICKIADFGLARLIEDNEYTARQGAKFPIKWTAPEAALYGRFTIKSDVWSFGILLTELVTKGRVPYPGMNNREVLEQVERGYRMPCPQDCPISLHELMIHCWKKDPEERPTFEYLQSFLEDYFTATEPQYQPGENLVDENLYF
seq_925babf455e1a2da5207ed61
[ "2" ]
X-RAY DIFFRACTION
2.22
2026-03-18
0.98227
1
core
seq_49d757fa60ff99b0d2bc2a03
struct_d38926c0a86ec433
component_3f8b289bd5ed90ed
train
2
10dj_B
10dk_A
10dk
A
A
1
MATPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSSGGTPKLVLYSEDVNMETPDTHLSYKPGKSDDNSKAMLGQQSMPNRPNYIAFRDNFIGLMYYNSTGNMG...
seq_0e2ee9f45935c6263d849e83
[ "1" ]
ELECTRON MICROSCOPY
3.22
2026-05-27
0.9946
1
core
seq_b360e235ec9237254a4dc51a
struct_f23e1e64a56e6400
component_3f8b289bd5ed90ed
train
3
10dk_B
10dk_B
10dk
B
B
1
MATPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSSGGTPKLVLYSEDVNMETPDTHLSYKPGKSDDNSKAMLGQQSMPNRPNYIAFRDNFIGLMYYNSTGNMG...
seq_0e2ee9f45935c6263d849e83
[ "1" ]
ELECTRON MICROSCOPY
3.22
2026-05-27
0.99568
1
core
seq_b360e235ec9237254a4dc51a
struct_f23e1e64a56e6400
component_3f8b289bd5ed90ed
train
3
10dk_B
10dk_C
10dk
C
C
1
MATPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSSGGTPKLVLYSEDVNMETPDTHLSYKPGKSDDNSKAMLGQQSMPNRPNYIAFRDNFIGLMYYNSTGNMG...
seq_0e2ee9f45935c6263d849e83
[ "1" ]
ELECTRON MICROSCOPY
3.22
2026-05-27
0.9946
1
core
seq_b360e235ec9237254a4dc51a
struct_f23e1e64a56e6400
component_3f8b289bd5ed90ed
train
3
10dk_B
10dp_A
10dp
A
A
1
TPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDTQVQVAAEDDQDDDEEEEQLPQQRNGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSVNAMNEANAIQPKLLLYSEDVNMETPDTHLSYKPGKSDDNSKAMLG...
seq_6ec82d74f63c3dbd66c7a119
[ "1" ]
ELECTRON MICROSCOPY
3.25
2026-05-27
0.970711
1
core
seq_b360e235ec9237254a4dc51a
struct_f23e1e64a56e6400
component_3f8b289bd5ed90ed
train
3
10dp_A
10dp_B
10dp
B
B
1
TPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDTQVQVAAEDDQDDDEEEEQLPQQRNGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSVNAMNEANAIQPKLLLYSEDVNMETPDTHLSYKPGKSDDNSKAMLG...
seq_6ec82d74f63c3dbd66c7a119
[ "1" ]
ELECTRON MICROSCOPY
3.25
2026-05-27
0.970711
1
core
seq_b360e235ec9237254a4dc51a
struct_f23e1e64a56e6400
component_3f8b289bd5ed90ed
train
3
10dp_A
10dp_C
10dp
C
C
1
TPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDTQVQVAAEDDQDDDEEEEQLPQQRNGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSVNAMNEANAIQPKLLLYSEDVNMETPDTHLSYKPGKSDDNSKAMLG...
seq_6ec82d74f63c3dbd66c7a119
[ "1" ]
ELECTRON MICROSCOPY
3.25
2026-05-27
0.969665
1
core
seq_b360e235ec9237254a4dc51a
struct_f23e1e64a56e6400
component_3f8b289bd5ed90ed
train
3
10dp_A
10dv_A
10dv
A
A
1
SGFRKMAFPSGKVEGCMVQVTCGTTTLNGLWLDDVVYCPRHVICTSEDMLNPNYEDLLIRKSNHNFLVQAGNVQLRVIGHSMQNCVLKLKVDTANPKTPKYKFVRIQPGQTFSVLACYNGSPSGVYQCAMRPNFTIKGSFLNGSAGSVGFNIDYDCVSFCYMHHMELPTGVHAGTDLEGNFYGPFVDRQTAQAAGTDTTITVNVLAWLYAAVINGDRWFLNRFTTTLNDFNLVAMKYNYEPLTQDHVDILGPLSAQTGIAVLDMCASLKELLQNGMNGRTILGSALLEDEFTPFDVVRQCSGVTFQSAVMQYKLILNGKT...
seq_3f7754e0a895ca6e7a129a68
[ "1" ]
X-RAY DIFFRACTION
2.05
2026-05-06
0.806971
1
core
seq_2fdfb46ec3991cba6d737539
struct_b98635064a47290c
component_3f8b289bd5ed90ed
train
2
10dv_A
10dv_B
10dv
B
B
1
SGFRKMAFPSGKVEGCMVQVTCGTTTLNGLWLDDVVYCPRHVICTSEDMLNPNYEDLLIRKSNHNFLVQAGNVQLRVIGHSMQNCVLKLKVDTANPKTPKYKFVRIQPGQTFSVLACYNGSPSGVYQCAMRPNFTIKGSFLNGSAGSVGFNIDYDCVSFCYMHHMELPTGVHAGTDLEGNFYGPFVDRQTAQAAGTDTTITVNVLAWLYAAVINGDRWFLNRFTTTLNDFNLVAMKYNYEPLTQDHVDILGPLSAQTGIAVLDMCASLKELLQNGMNGRTILGSALLEDEFTPFDVVRQCSGVTFQSAVMQYKLILNGKT...
seq_3f7754e0a895ca6e7a129a68
[ "1" ]
X-RAY DIFFRACTION
2.05
2026-05-06
0.806971
1
core
seq_2fdfb46ec3991cba6d737539
struct_b98635064a47290c
component_3f8b289bd5ed90ed
train
2
10dv_A
10en_A
10en
A
A
1
KIVNIGAVLSTRKHEQMFREAVNQANKRHGSWKIQLNATSVTHKPNAIQMALSVCEDLISSQVYAILVSHPPTPNDHFTPTPVSYTAGFYRIPVLGLTTRMSIYSDKSIHLSFLRTVPPYSHQSSVWFEMMRVYSWNHIILLVSDDHEGRAAQKRLETLLEERESKAEKVLQFDPGTKNVTALLMEARELEARVIILSASEDDAATVYRAAAMLNMTGSGYVWLVGEREISGNALRYAPDGIIGLQLINGKNESAHISDAVGVVAQAVHELLEKENITDPPRGCVGNTNIWKTGPLFKRVLMSSKYADGVTGRVEFNEDG...
seq_7255603097ee423fed8b0c34
[ "1" ]
ELECTRON MICROSCOPY
3.7
2026-03-25
0.973072
1
core
seq_0c6927097c6f94558cbe12bb
struct_14d5849aae0a8126
component_3f8b289bd5ed90ed
train
6
10en_A
10en_B
10en
B
B
2
FHHLSVVPRVELVAMNETDPKSIITRICDLMSDRKIQGVVFADDTDQEAIAQILDFISAQTLTPILGIHGGSSMIMADKDESSMFFQFGPSIEQQASVMLNIMEEYDWYIFSIVTTYFPGYQDFVNKIRSTIENSFVGWELEEVLLLDMSLDDGDSKIQNQLKKLQSPIILLYCTKEEATYIFEVANSVGLTGYGYTWIVPSLVAGDTDTVPSEFPTGLISVSYDEWDYGLPARVRDGIAIITTAASDMLSEHSFIPEPKSSCYNTHEKRIYQSNMLNRYLINVTFEGRNLSFSEDGYQMHPKLVIILLNKERKWERVGK...
seq_0b21ed8660d006ae3b501226
[ "1" ]
ELECTRON MICROSCOPY
3.7
2026-03-25
0.955527
1
core
seq_c633012c5d9396303f6c3955
struct_5f99414d7af5f3ac
component_3f8b289bd5ed90ed
train
6
10en_B
10en_C
10en
C
C
1
KIVNIGAVLSTRKHEQMFREAVNQANKRHGSWKIQLNATSVTHKPNAIQMALSVCEDLISSQVYAILVSHPPTPNDHFTPTPVSYTAGFYRIPVLGLTTRMSIYSDKSIHLSFLRTVPPYSHQSSVWFEMMRVYSWNHIILLVSDDHEGRAAQKRLETLLEERESKAEKVLQFDPGTKNVTALLMEARELEARVIILSASEDDAATVYRAAAMLNMTGSGYVWLVGEREISGNALRYAPDGIIGLQLINGKNESAHISDAVGVVAQAVHELLEKENITDPPRGCVGNTNIWKTGPLFKRVLMSSKYADGVTGRVEFNEDG...
seq_7255603097ee423fed8b0c34
[ "1" ]
ELECTRON MICROSCOPY
3.7
2026-03-25
0.973072
1
core
seq_0c6927097c6f94558cbe12bb
struct_f9d265a2cd2aaab5
component_3f8b289bd5ed90ed
train
6
10en_A
10en_D
10en
D
D
2
FHHLSVVPRVELVAMNETDPKSIITRICDLMSDRKIQGVVFADDTDQEAIAQILDFISAQTLTPILGIHGGSSMIMADKDESSMFFQFGPSIEQQASVMLNIMEEYDWYIFSIVTTYFPGYQDFVNKIRSTIENSFVGWELEEVLLLDMSLDDGDSKIQNQLKKLQSPIILLYCTKEEATYIFEVANSVGLTGYGYTWIVPSLVAGDTDTVPSEFPTGLISVSYDEWDYGLPARVRDGIAIITTAASDMLSEHSFIPEPKSSCYNTHEKRIYQSNMLNRYLINVTFEGRNLSFSEDGYQMHPKLVIILLNKERKWERVGK...
seq_0b21ed8660d006ae3b501226
[ "1" ]
ELECTRON MICROSCOPY
3.7
2026-03-25
0.951715
1
core
seq_c633012c5d9396303f6c3955
struct_5f99414d7af5f3ac
component_3f8b289bd5ed90ed
train
6
10en_B
10en_E
10en
E
E
3
DIVLTQSPASLAVSLGQRATISCRASKSVSTSGYSYMNWYQQKAGQPPKLLIYLASNLESGVPARFSGSGSGTDFTLNIHPVEEEDAATYYCQHSRELPYTFGGGTKLEIK
seq_2a897060776f2ba361788d64
[ "1" ]
ELECTRON MICROSCOPY
3.7
2026-03-25
1
1
core
seq_392b87a60783b379b79fea27
struct_05d89e0f8014586e
component_3f8b289bd5ed90ed
train
2
10en_E
10en_F
10en
F
F
4
EVQLQQSGPELVKPGASVKMSCKASGYTFTSYVMHWVKQKPGQGLEWIGYINPYSDGTNYNEKFKGKATLTSDKSSSTAYMELSSLTSEDSAVYYCARLTTVVEGAMDYWGQGTSVTVSS
seq_8e8866012ad1f1eb43f44e6d
[ "1" ]
ELECTRON MICROSCOPY
3.7
2026-03-25
1
1
core
seq_12249a9611cfdc161bfe7e1c
struct_e1bd67264b90f9fa
component_3f8b289bd5ed90ed
train
2
10en_F
10en_G
10en
G
I
3
DIVLTQSPASLAVSLGQRATISCRASKSVSTSGYSYMNWYQQKAGQPPKLLIYLASNLESGVPARFSGSGSGTDFTLNIHPVEEEDAATYYCQHSRELPYTFGGGTKLEIK
seq_2a897060776f2ba361788d64
[ "1" ]
ELECTRON MICROSCOPY
3.7
2026-03-25
1
1
core
seq_392b87a60783b379b79fea27
struct_05d89e0f8014586e
component_3f8b289bd5ed90ed
train
2
10en_E
10en_H
10en
H
J
4
EVQLQQSGPELVKPGASVKMSCKASGYTFTSYVMHWVKQKPGQGLEWIGYINPYSDGTNYNEKFKGKATLTSDKSSSTAYMELSSLTSEDSAVYYCARLTTVVEGAMDYWGQGTSVTVSS
seq_8e8866012ad1f1eb43f44e6d
[ "1" ]
ELECTRON MICROSCOPY
3.7
2026-03-25
1
1
core
seq_12249a9611cfdc161bfe7e1c
struct_c062861de08ab299
component_3f8b289bd5ed90ed
train
2
10en_F
10eo_A
10eo
A
A
1
ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV...
seq_d61026e47f4265b59f0b86a6
[ "1" ]
ELECTRON MICROSCOPY
3.2
2026-05-27
0.889746
1
core
seq_bb3a0a9b067359c4dba1d607
struct_f388146ed7cea03a
component_3f8b289bd5ed90ed
train
6
10eo_A
10eo_B
10eo
B
B
1
ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV...
seq_d61026e47f4265b59f0b86a6
[ "1" ]
ELECTRON MICROSCOPY
3.2
2026-05-27
0.889746
1
core
seq_bb3a0a9b067359c4dba1d607
struct_f388146ed7cea03a
component_3f8b289bd5ed90ed
train
6
10eo_A
10ep_A
10ep
A
B
1
ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV...
seq_d61026e47f4265b59f0b86a6
[ "1" ]
ELECTRON MICROSCOPY
3.2
2026-05-27
0.889746
1
core
seq_bb3a0a9b067359c4dba1d607
struct_f388146ed7cea03a
component_3f8b289bd5ed90ed
train
6
10eo_A
10ep_B
10ep
B
A
1
ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV...
seq_d61026e47f4265b59f0b86a6
[ "1" ]
ELECTRON MICROSCOPY
3.2
2026-05-27
0.878721
1
core
seq_bb3a0a9b067359c4dba1d607
struct_f388146ed7cea03a
component_3f8b289bd5ed90ed
train
6
10eo_A
10eq_A
10eq
A
A
1
HHHHHHGGASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVP...
seq_ecae2105c114f891ff4a7502
[ "1" ]
ELECTRON MICROSCOPY
3.3
2026-05-27
0.679162
1
extended
seq_bb3a0a9b067359c4dba1d607
struct_f388146ed7cea03a
component_3f8b289bd5ed90ed
train
4
10es_A
10eq_B
10eq
B
B
1
HHHHHHGGASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVP...
seq_ecae2105c114f891ff4a7502
[ "1" ]
ELECTRON MICROSCOPY
3.3
2026-05-27
0.888644
1
core
seq_bb3a0a9b067359c4dba1d607
struct_f388146ed7cea03a
component_3f8b289bd5ed90ed
train
4
10es_A
10er_A
10er
A
B
1
ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV...
seq_d61026e47f4265b59f0b86a6
[ "1" ]
ELECTRON MICROSCOPY
3.2
2026-05-27
0.878721
1
core
seq_bb3a0a9b067359c4dba1d607
struct_f388146ed7cea03a
component_3f8b289bd5ed90ed
train
6
10eo_A
10er_B
10er
B
A
1
ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV...
seq_d61026e47f4265b59f0b86a6
[ "1" ]
ELECTRON MICROSCOPY
3.2
2026-05-27
0.878721
1
core
seq_bb3a0a9b067359c4dba1d607
struct_f388146ed7cea03a
component_3f8b289bd5ed90ed
train
6
10eo_A
10es_A
10es
A
A
1
HHHHHHGGASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVP...
seq_ecae2105c114f891ff4a7502
[ "1" ]
ELECTRON MICROSCOPY
3
2026-05-27
0.878721
1
core
seq_bb3a0a9b067359c4dba1d607
struct_f388146ed7cea03a
component_3f8b289bd5ed90ed
train
4
10es_A
End of preview. Expand in Data Studio

PDB-Chain-Complex-Benchmark-Rigor

Rigor rebuild of Synthyra/PDB-Chain-Complex-Benchmark with split assignments recomputed from the published chain and complex parquet artifacts.

Split Policy

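Splits are assigned at the level of connected components of a graph whose edges link chains that share an exact sequence, sequence hash, 30% sequence cluster, structure cluster, or source split component, or that belong to the same PDB asymmetric unit, the same chain assembly, or the same biological assembly (co-membership taken from the complex rows). Every chain in a component receives the same split. The target is 90/5/5 train/validation/test by component count, not by row count: because component sizes are highly uneven, the row-level proportions differ greatly (1,068,780 train chain rows versus 334 each for validation and test; see row_counts under Build Metadata).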

The rebuild aborts before upload if any chain or complex member appears in more than one of the train, validation, and test splits, as measured by chain UID, sequence, sequence hash, 30% sequence cluster, structure cluster, or recomputed split component.

The list-valued payload columns of the complex table are regenerated from the chain table during the rebuild, and the assertions are then run directly on the emitted payloads, including asymmetric_unit_chain_uids.

After writing parquet, the builder reloads the emitted chain and complex shards and reruns split-routing, payload-consistency, and disjointness checks from the serialized files.

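This artifact-only rebuild does not rerun Foldseek or MMseqs2; it enforces and verifies the published cluster labels as given, plus external sequence-verification edges when they are supplied. None were supplied for this build (sequence_verification_edges.provided is false under Leakage Assertions).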

Build Metadata

{
  "batch_size": 16384,
  "chain_scan": {
    "assembly_membership_edges_seen": 1138910,
    "asymmetric_unit_membership_edges_seen": 1069448,
    "chains_scanned": 1069448
  },
  "chain_write": {
    "file_counts": {
      "test": 1,
      "train": 22,
      "valid": 1
    },
    "row_counts": {
      "test": 334,
      "train": 1068780,
      "valid": 334
    }
  },
  "complex_edge_scan": {
    "complex_member_edges_seen": 775327,
    "complexes_scanned_for_edges": 363583
  },
  "complex_write": {
    "file_counts": {
      "test": 1,
      "train": 8,
      "valid": 1
    },
    "member_chain_rows": 1138910,
    "member_fields": {
      "asymmetric_unit_chain_uids": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 1069448
      },
      "chain_uid": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 1069448
      },
      "sequence_clusters_30": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 48857
      },
      "sequence_hashes": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 183467
      },
      "sequences": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 183467
      },
      "split_components": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 6684
      },
      "structure_clusters": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 66989
      }
    },
    "row_counts": {
      "test": 335,
      "train": 362909,
      "valid": 339
    }
  },
  "component_stats": {
    "split_component_count": 6684,
    "test_component_count": 334,
    "train_component_count": 6016,
    "valid_component_count": 334
  },
  "cpu_count": 32,
  "elapsed_seconds": 75.866,
  "foldseek_path": "",
  "include_source_split_component_edges": true,
  "max_rows_per_shard": 50000,
  "mmseqs_path": "",
  "nvidia-smi_path": "C:\\Windows\\system32\\nvidia-smi.EXE",
  "nvidia-smi_version": "Tue Jun 30 18:02:49 2026       \n+-----------------------------------------------------------------------------------------+\n| NVIDIA-SMI 580.88                 Driver Version: 580.88         CUDA Version: 13.0     |\n+-----------------------------------------+------------------------+----------------------+\n| GPU  Name                  Driver-Model | Bus-Id          Disp.A | Volatile Uncorr. ECC |\n| Fan  Temp   Perf          Pwr:Usage/Cap |           Memory-Usage | GPU-Util  Compute M. |\n|                                         |                        |               MIG M. |\n|=========================================+========================+======================|\n|   0  NVIDIA GeForce RTX 4070 ...  WDDM  |   00000000:01:00.0  On |                  N/A |\n| N/A   41C    P8              6W /  121W |     984MiB /   8188MiB |     10%      Default |\n|                                         |                        |                  N/A |\n+-----------------------------------------+------------------------+----------------------+\n\n+-----------------------------------------------------------------------------------------+\n| Processes:                                                                              |\n|  GPU   GI   CI              PID   Type   Process name                        GPU Memory |\n|        ID   ID                                                               Usage      |\n|=========================================================================================|\n|    0   N/A  N/A            8844    C+G   ...indows\\System32\\ShellHost.exe      N/A      |\n|    0   N/A  N/A           10456    C+G   ..._cw5n1h2txyewy\\SearchHost.exe      N/A      |\n|    0   N/A  N/A           13212    C+G   ...5n1h2txyewy\\TextInputHost.exe      N/A      |\n|    0   N/A  N/A           36048    C+G   ...Chrome\\Application\\chrome.exe      N/A      |\n|    0   N/A  N/A           41088    C+G   
...ntrolPanel\\SystemSettings.exe      N/A      |\n|    0   N/A  N/A           63696    C+G   ...8bbwe\\PhoneExperienceHost.exe      N/A      |\n|    0   N/A  N/A           72372    C+G   ...y\\StartMenuExperienceHost.exe      N/A      |\n|    0   N/A  N/A           84244    C+G   ...xyewy\\ShellExperienceHost.exe      N/A      |\n|    0   N/A  N/A          104536    C+G   C:\\Windows\\explorer.exe               N/A      |\n|    0   N/A  N/A          152648    C+G   ....0.4022.80\\msedgewebview2.exe      N/A      |\n|    0   N/A  N/A          152984    C+G   ...e Experience\\NVIDIA Share.exe      N/A      |\n|    0   N/A  N/A          155976    C+G   ...em32\\ApplicationFrameHost.exe      N/A      |\n|    0   N/A  N/A          162800    C+G   ...p\\app-3.6.1\\GitHubDesktop.exe      N/A      |\n|    0   N/A  N/A          196292    C+G   ...Chrome\\Application\\chrome.exe      N/A      |\n|    0   N/A  N/A          198076    C+G   ...__2p2nqsd0c76g0\\app\\Codex.exe      N/A      |\n|    0   N/A  N/A          206536    C+G   ...2txyewy\\CrossDeviceResume.exe      N/A      |\n|    0   N/A  N/A          221536    C+G   ...Files\\Notepad++\\notepad++.exe      N/A      |\n+-----------------------------------------------------------------------------------------+",
  "platform": "Windows-11-10.0.26200-SP0",
  "python": "3.12.13",
  "seed": 42,
  "sequence_verification_max_unknown_fraction": 0.0,
  "source_chain_rows": 1069448,
  "source_complex_rows": 363583,
  "source_repo_id": "Synthyra/PDB-Chain-Complex-Benchmark",
  "source_snapshot_dir": "C:\\tmp\\hf_pdb_chain_complex_cache\\datasets--Synthyra--PDB-Chain-Complex-Benchmark\\snapshots\\3eb55ee7289dfedfbddf0cde48b68c5395783ccf",
  "target_repo_id": "Synthyra/PDB-Chain-Complex-Benchmark-Rigor",
  "test_frac": 0.05,
  "valid_frac": 0.05
}

Leakage Assertions

{
  "chains": {
    "fields": {
      "chain_uid": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 1069448
      },
      "seqs": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 183467
      },
      "sequence_cluster_30": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 48857
      },
      "sequence_hash": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 183467
      },
      "split_component": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 6684
      },
      "structure_cluster": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 66989
      }
    },
    "post_write": {
      "fields": {
        "chain_uid": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 1069448
        },
        "seqs": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 183467
        },
        "sequence_cluster_30": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 48857
        },
        "sequence_hash": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 183467
        },
        "split_component": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 6684
        },
        "structure_cluster": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 66989
        }
      },
      "rows": 1069448,
      "split_counts": {
        "test": 334,
        "train": 1068780,
        "valid": 334
      }
    },
    "rows": 1069448,
    "sequence_verification_edges": {
      "checked_edges": 0,
      "cross_split_edges": 0,
      "provided": false,
      "skipped_self_edges": 0,
      "skipped_unknown_edges": 0,
      "total_edges": 0
    },
    "split_counts": {
      "test": 334,
      "train": 1068780,
      "valid": 334
    }
  },
  "complexes": {
    "member_chain_rows": 1138910,
    "member_fields": {
      "asymmetric_unit_chain_uids": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 1069448
      },
      "chain_uid": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 1069448
      },
      "sequence_clusters_30": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 48857
      },
      "sequence_hashes": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 183467
      },
      "sequences": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 183467
      },
      "split_components": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 6684
      },
      "structure_clusters": {
        "crossing_values": 0,
        "max_pairwise_overlap": 0,
        "unique_values": 66989
      }
    },
    "member_split_consistency": "passed",
    "payload_columns_regenerated_from_chains": true,
    "post_write": {
      "asymmetric_unit_chain_rows": 1760175,
      "member_chain_rows": 1138910,
      "member_fields": {
        "asymmetric_unit_chain_uids": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 1069448
        },
        "chain_uid": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 1069448
        },
        "sequence_clusters_30": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 48857
        },
        "sequence_hashes": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 183467
        },
        "sequences": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 183467
        },
        "split_components": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 6684
        },
        "structure_clusters": {
          "crossing_values": 0,
          "max_pairwise_overlap": 0,
          "unique_values": 66989
        }
      },
      "payload_columns_match_chain_rows": true,
      "rows": 363583,
      "shard_split_routing": "passed",
      "split_counts": {
        "test": 335,
        "train": 362909,
        "valid": 339
      }
    },
    "rows": 363583,
    "split_counts": {
      "test": 335,
      "train": 362909,
      "valid": 339
    }
  }
}
Downloads last month
11