chain_uid stringlengths 6 8 | pdb_id stringlengths 4 4 | label_asym_id stringlengths 1 3 | auth_asym_id stringlengths 1 4 | entity_id stringclasses 165
values | seqs stringlengths 2 8.57k | sequence_hash stringlengths 28 28 | assembly_ids listlengths 1 11 | method stringclasses 10
values | resolution float64 0.48 70 ⌀ | release_date stringdate 1976-05-19 00:00:00 2026-06-24 00:00:00 | observed_ca_fraction float64 0 1 | standard_aa_fraction float64 0 1 | quality_tier stringclasses 3
values | sequence_cluster_30 stringlengths 28 28 | structure_cluster stringlengths 23 23 | split_component stringlengths 26 26 | split stringclasses 1
value | member_count int64 1 2.58k | representative_chain_id stringlengths 6 8 |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
7dvd_E | 7dvd | E | E | 2 | EIGAQLRRMADDLNA | seq_49f56b636a9463f8200600e1 | [
"5"
] | X-RAY DIFFRACTION | 2.59 | 2021-08-04 | 1 | 1 | low_quality | seq_49f56b636a9463f8200600e1 | struct_def5dbf48fc302c7 | component_3f8b289bd5ed90ed | train | 1 | 7dvd_E |
8gjs_B | 8gjs | B | B | 2 | XLTFXEYWAQLLAAAAAA | seq_2972d14d2f2affdb3144697f | [
"2"
] | X-RAY DIFFRACTION | 1.56 | 2023-07-26 | 0.777778 | 0.888889 | low_quality | seq_2972d14d2f2affdb3144697f | struct_ccd94f698c695660 | component_3f8b289bd5ed90ed | train | 1 | 8gjs_B |
4l67_B | 4l67 | B | B | 2 | PRQWQSLIEESARRPKPLVDPACIT | seq_8179aa95dfe8ad8bd08a0a39 | [
"2"
] | X-RAY DIFFRACTION | 2.8 | 2013-08-14 | 0.8 | 1 | extended | seq_8179aa95dfe8ad8bd08a0a39 | struct_840cb6d92eeb5ccf | component_3f8b289bd5ed90ed | train | 1 | 4l67_B |
2z5n_B | 2z5n | B | B | 2 | YSNQQSGYGKVSRRGGHQNSYKPY | seq_9dc99e7323a4e28e2df0652f | [
"2"
] | X-RAY DIFFRACTION | 3.2 | 2007-10-23 | 0.625 | 1 | extended | seq_9dc99e7323a4e28e2df0652f | struct_ee0d809a4bdd95b3 | component_3f8b289bd5ed90ed | train | 1 | 2z5n_B |
200l_A | 200l | A | A | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMAQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_6642496e01888363cfbe50c9 | [
"1"
] | X-RAY DIFFRACTION | 1.95 | 1996-03-08 | 0.987805 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 4 | 200l_A |
101m_A | 101m | A | A | 1 | MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRVKHLKTEAEMKASEDLKKHGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG | seq_d252e12ea80505784e26ecbf | [
"1"
] | X-RAY DIFFRACTION | 2.07 | 1998-04-08 | 1 | 1 | core | seq_fb0ff316e972937b8152db3a | struct_e448a8132443a193 | component_3f8b289bd5ed90ed | train | 4 | 1mym_A |
201l_A | 201l | A | A | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKHPAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_0533b597b5311f6a56b83d92 | [
"1"
] | X-RAY DIFFRACTION | 2 | 1994-01-31 | 0.987952 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 2 | 201l_B |
201l_B | 201l | B | B | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKHPAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_0533b597b5311f6a56b83d92 | [
"2"
] | X-RAY DIFFRACTION | 2 | 1994-01-31 | 1 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 2 | 201l_B |
102l_A | 102l | A | A | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAAKSELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_ef78343c5b60c127a98f1d12 | [
"1"
] | X-RAY DIFFRACTION | 1.74 | 1993-10-31 | 0.987879 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 1 | 102l_A |
102m_A | 102m | A | A | 1 | MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKAGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG | seq_7762da8704b65f9798e48420 | [
"1"
] | X-RAY DIFFRACTION | 1.84 | 1998-04-08 | 1 | 1 | core | seq_fb0ff316e972937b8152db3a | struct_e448a8132443a193 | component_3f8b289bd5ed90ed | train | 12 | 5ilm_A |
103l_A | 103l | A | A | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNSLDAAKSELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_93fee99256cf88732db6022f | [
"1"
] | X-RAY DIFFRACTION | 1.9 | 1993-10-31 | 0.952096 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 1 | 103l_A |
103m_A | 103m | A | A | 1 | MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKAGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG | seq_7762da8704b65f9798e48420 | [
"1"
] | X-RAY DIFFRACTION | 2.07 | 1998-04-08 | 1 | 1 | core | seq_fb0ff316e972937b8152db3a | struct_e448a8132443a193 | component_3f8b289bd5ed90ed | train | 12 | 5ilm_A |
104l_A | 104l | A | A | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSAAELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_29581997a20b78f493653784 | [
"1"
] | X-RAY DIFFRACTION | 2.8 | 1993-10-31 | 0.987952 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 2 | 104l_A |
104l_B | 104l | B | B | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSAAELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_29581997a20b78f493653784 | [
"2"
] | X-RAY DIFFRACTION | 2.8 | 1993-10-31 | 0.987952 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 2 | 104l_A |
104m_A | 104m | A | A | 1 | VLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGDFGADAQGAMNKALELFRKDIAAKYKELGYQG | seq_4e1e5bdd96abfd0c314159fd | [
"1"
] | X-RAY DIFFRACTION | 1.71 | 1998-04-08 | 1 | 1 | core | seq_fb0ff316e972937b8152db3a | struct_e448a8132443a193 | component_3f8b289bd5ed90ed | train | 82 | 2ekt_A |
105m_A | 105m | A | A | 1 | VLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGDFGADAQGAMNKALELFRKDIAAKYKELGYQG | seq_4e1e5bdd96abfd0c314159fd | [
"1"
] | X-RAY DIFFRACTION | 2.02 | 1998-04-08 | 1 | 1 | core | seq_fb0ff316e972937b8152db3a | struct_e448a8132443a193 | component_3f8b289bd5ed90ed | train | 82 | 2ekt_A |
205l_A | 205l | A | A | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSAAAELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_165b1a0fba32e47f2770d46d | [
"1"
] | X-RAY DIFFRACTION | 2.1 | 1994-01-31 | 0.952096 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 1 | 205l_A |
106m_A | 106m | A | A | 1 | MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTFLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG | seq_efeee66808c25d1bd8c64d00 | [
"1"
] | X-RAY DIFFRACTION | 1.99 | 1998-04-08 | 1 | 1 | core | seq_fb0ff316e972937b8152db3a | struct_e448a8132443a193 | component_3f8b289bd5ed90ed | train | 6 | 1mll_A |
206l_A | 206l | A | A | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNASKSELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_56f25cb14e837a305e73f7fa | [
"1"
] | X-RAY DIFFRACTION | 1.75 | 1996-08-17 | 0.987805 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 1 | 206l_A |
107l_A | 107l | A | A | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKGELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_05bad0eeac35d610558735c1 | [
"1"
] | X-RAY DIFFRACTION | 1.8 | 1993-10-31 | 0.987805 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 1 | 107l_A |
107m_A | 107m | A | A | 1 | MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTFLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG | seq_efeee66808c25d1bd8c64d00 | [
"1"
] | X-RAY DIFFRACTION | 2.09 | 1998-04-08 | 1 | 1 | core | seq_fb0ff316e972937b8152db3a | struct_e448a8132443a193 | component_3f8b289bd5ed90ed | train | 6 | 1mll_A |
207l_A | 207l | A | A | 1 | KVFERCELARTLKRLGMDGYRGISLANWMCLAKWESGYNTRATNYNAGDRSTDYGIFQINSRYWCNDGKTPGAVNAAHLSCSALLQDNIADAVACAKRVVRDPQGIRAWVAWRNRCQNRDVRQYVQGCGV | seq_0b1f7f2773d6dc1237cb7460 | [
"1"
] | X-RAY DIFFRACTION | 1.75 | 1996-10-14 | 1 | 1 | core | seq_1b6af75dd3c91cecedd7194a | struct_af742d4f61faba4f | component_3f8b289bd5ed90ed | train | 4 | 207l_A |
108l_A | 108l | A | A | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKIELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_381e137b01eb744dea5516de | [
"1"
] | X-RAY DIFFRACTION | 1.8 | 1993-10-31 | 0.987805 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 1 | 108l_A |
108m_A | 108m | A | A | 1 | MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTFLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG | seq_efeee66808c25d1bd8c64d00 | [
"1"
] | X-RAY DIFFRACTION | 2.67 | 1998-05-20 | 1 | 1 | core | seq_fb0ff316e972937b8152db3a | struct_e448a8132443a193 | component_3f8b289bd5ed90ed | train | 6 | 1mll_A |
208l_A | 208l | A | A | 1 | KVFERCELARTLKRLGMDGYRGISLANWMCLAKWESGYNTRATNYNAGDRSTDYGIFQINSRYWCNDGKTPGAVNAAHLSCSALLQDNIADAVACAKRVVRDPQGIRAWVAWRNRCQNRDVRQYVQGCGV | seq_0b1f7f2773d6dc1237cb7460 | [
"1"
] | X-RAY DIFFRACTION | 1.8 | 1996-10-14 | 1 | 1 | core | seq_1b6af75dd3c91cecedd7194a | struct_af742d4f61faba4f | component_3f8b289bd5ed90ed | train | 4 | 207l_A |
109l_A | 109l | A | A | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKKELDKAIGRNTNGVITKDEAEKLFNQDVDAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_26be00d0f75767c685201906 | [
"1"
] | X-RAY DIFFRACTION | 1.85 | 1993-10-31 | 0.987805 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 1 | 109l_A |
109m_A | 109m | A | A | 1 | MVLSEGEWQLVLHVWAKVEADVAGHGQDILIRLFKSHPETLEKFDRFKHLKTEAEMKASEDLKKHGVTVLTALGAILKKKGHHEAELKPLAQSHATKHKIPIKYLEFISEAIIHVLHSRHPGNFGADAQGAMNKALELFRKDIAAKYKELGYQG | seq_7068ee572ee196e373d3371a | [
"1"
] | X-RAY DIFFRACTION | 1.83 | 1998-04-08 | 1 | 1 | core | seq_fb0ff316e972937b8152db3a | struct_e448a8132443a193 | component_3f8b289bd5ed90ed | train | 26 | 1jw8_A |
209d_C | 209d | C | C | 2 | TVPGVXTVPGV | seq_f1490965ba1401b8776ff444 | [
"1"
] | X-RAY DIFFRACTION | 3 | 1995-10-15 | 0.363636 | 0.909091 | low_quality | seq_f1490965ba1401b8776ff444 | struct_8d2f10f4b300c5e6 | component_3f8b289bd5ed90ed | train | 59 | 1qfi_A |
209l_A | 209l | A | A | 1 | MNIFEMLRIDEGLRLKIYKDTEGYYTIGIGHLLTKSPSLNAAKSELDKAIGRNTNGVITKDEAEKLFNQDVDAAAAAVRGILRNAKLKPVYDSLDAVRRAALINMVFQMGETGVAGFTNSLRMLQQKRWDEAAVNLAKSRWYNQTPNRAKRVITTFRTGTWDAYKNL | seq_be5b777b7a3781b22a595b9d | [
"1"
] | X-RAY DIFFRACTION | 2.7 | 1996-12-23 | 0.988024 | 1 | core | seq_431e4645a02f8a5bc01ebc6b | struct_519869b66e394cbb | component_3f8b289bd5ed90ed | train | 1 | 209l_A |
10ad_A | 10ad | A | E | 1 | MDALIIPVTMEVPCDSRGQRMWWAFLASSMVTFFGGLFIILLWRTLKYLWTVCCHCGGKTKEAQKINNGSSQADGTLKPVDEKEEAVAAEVGWMTSVKDWAGVMISAQTLTGRVLVVLVFALSIGALVIYFIDSSNPIESCQNFYKDFTLQIDMAFNVFFLLYFGLRFIAANDKLWFWLEVNSVVDFFTVPPVFVSVYLNRSWLGLRFLRALRLIQFSEILQFLNILKTSNSIKLVNLLSIFISTWLTAAGFIHLVENSGDPWENFQNNQALTYWECVYLLMVTMSTVGYGDVYAKTTLGRLFMVFFILGGLAMFASYVP... | seq_b48877120660dd28bb133cdd | [
"1"
] | ELECTRON MICROSCOPY | 3.44 | 2026-02-04 | 0.785265 | 1 | extended | seq_088fe509fecb2499d15f55d5 | struct_ccfd713d07f16c59 | component_3f8b289bd5ed90ed | train | 4 | 10ad_A |
10ad_B | 10ad | B | C | 1 | MDALIIPVTMEVPCDSRGQRMWWAFLASSMVTFFGGLFIILLWRTLKYLWTVCCHCGGKTKEAQKINNGSSQADGTLKPVDEKEEAVAAEVGWMTSVKDWAGVMISAQTLTGRVLVVLVFALSIGALVIYFIDSSNPIESCQNFYKDFTLQIDMAFNVFFLLYFGLRFIAANDKLWFWLEVNSVVDFFTVPPVFVSVYLNRSWLGLRFLRALRLIQFSEILQFLNILKTSNSIKLVNLLSIFISTWLTAAGFIHLVENSGDPWENFQNNQALTYWECVYLLMVTMSTVGYGDVYAKTTLGRLFMVFFILGGLAMFASYVP... | seq_b48877120660dd28bb133cdd | [
"1"
] | ELECTRON MICROSCOPY | 3.44 | 2026-02-04 | 0.785265 | 1 | extended | seq_088fe509fecb2499d15f55d5 | struct_ccfd713d07f16c59 | component_3f8b289bd5ed90ed | train | 4 | 10ad_A |
10ad_C | 10ad | C | D | 1 | MDALIIPVTMEVPCDSRGQRMWWAFLASSMVTFFGGLFIILLWRTLKYLWTVCCHCGGKTKEAQKINNGSSQADGTLKPVDEKEEAVAAEVGWMTSVKDWAGVMISAQTLTGRVLVVLVFALSIGALVIYFIDSSNPIESCQNFYKDFTLQIDMAFNVFFLLYFGLRFIAANDKLWFWLEVNSVVDFFTVPPVFVSVYLNRSWLGLRFLRALRLIQFSEILQFLNILKTSNSIKLVNLLSIFISTWLTAAGFIHLVENSGDPWENFQNNQALTYWECVYLLMVTMSTVGYGDVYAKTTLGRLFMVFFILGGLAMFASYVP... | seq_b48877120660dd28bb133cdd | [
"1"
] | ELECTRON MICROSCOPY | 3.44 | 2026-02-04 | 0.785265 | 1 | extended | seq_088fe509fecb2499d15f55d5 | struct_ccfd713d07f16c59 | component_3f8b289bd5ed90ed | train | 4 | 10ad_A |
10ad_D | 10ad | D | A | 1 | MDALIIPVTMEVPCDSRGQRMWWAFLASSMVTFFGGLFIILLWRTLKYLWTVCCHCGGKTKEAQKINNGSSQADGTLKPVDEKEEAVAAEVGWMTSVKDWAGVMISAQTLTGRVLVVLVFALSIGALVIYFIDSSNPIESCQNFYKDFTLQIDMAFNVFFLLYFGLRFIAANDKLWFWLEVNSVVDFFTVPPVFVSVYLNRSWLGLRFLRALRLIQFSEILQFLNILKTSNSIKLVNLLSIFISTWLTAAGFIHLVENSGDPWENFQNNQALTYWECVYLLMVTMSTVGYGDVYAKTTLGRLFMVFFILGGLAMFASYVP... | seq_b48877120660dd28bb133cdd | [
"1"
] | ELECTRON MICROSCOPY | 3.44 | 2026-02-04 | 0.785265 | 1 | extended | seq_088fe509fecb2499d15f55d5 | struct_ccfd713d07f16c59 | component_3f8b289bd5ed90ed | train | 4 | 10ad_A |
10af_A | 10af | A | A | 1 | MAHHHHHHMSRPHVFFDITIGGSNAGRIVMELFADIVPKTAENFRCLCTGERGMGRSGKKLHYKGSKFHRVIPNFMLQGGDFTRGNGTGGESIYGEKFPDENFQEKHTGPGVLSMANAGPNTNGSQFFICTAKTEWLDGKHVVFGRVVEGMNVVKAVESKGSQSGRTSADIVIADCGQL | seq_a1f700ab62fc9048d6c89952 | [
"1"
] | X-RAY DIFFRACTION | 1.25 | 2026-01-21 | 0.949721 | 1 | core | seq_639d20e1b4c5fd1474620f19 | struct_5c276d9f03a7be39 | component_3f8b289bd5ed90ed | train | 1 | 10af_A |
10ah_A | 10ah | A | A | 1 | SNAGGSSPITGLVYDQRMMLHHNMWDSHHPELPQRISRIFSRHEELRLLSRCHRIPARLATEEELALCHSSKHISIIKSSEHMKPRDLNRLGDEYDSIFISNESYTCALLAAGSCFNSAQAILTGQVRNAVAIVRPPGHHAEKDTACGFCFFNTAALTARYAQSITRESLRVLIVDWDVHHGNGTQHIFEEDDSVLYISLHRYEDGAFFPNSEDANYDKVGLGKGRGYNVNIPWNGGKMGDPEYMAAFHHLVMPIAREFAPELVLVSAGFDAARGDPLGGFQVTPEGYAHLTHQLMSLAAGRVLIILEGGYNLTSISESM... | seq_be307890dd23905f77cdfafa | [
"1"
] | X-RAY DIFFRACTION | 2.2 | 2026-06-17 | 0.978022 | 1 | core | seq_cfa6024209130a23601f5d2d | struct_1aaf3c4c36263840 | component_3f8b289bd5ed90ed | train | 4 | 10ai_A |
10ah_B | 10ah | B | B | 1 | SNAGGSSPITGLVYDQRMMLHHNMWDSHHPELPQRISRIFSRHEELRLLSRCHRIPARLATEEELALCHSSKHISIIKSSEHMKPRDLNRLGDEYDSIFISNESYTCALLAAGSCFNSAQAILTGQVRNAVAIVRPPGHHAEKDTACGFCFFNTAALTARYAQSITRESLRVLIVDWDVHHGNGTQHIFEEDDSVLYISLHRYEDGAFFPNSEDANYDKVGLGKGRGYNVNIPWNGGKMGDPEYMAAFHHLVMPIAREFAPELVLVSAGFDAARGDPLGGFQVTPEGYAHLTHQLMSLAAGRVLIILEGGYNLTSISESM... | seq_be307890dd23905f77cdfafa | [
"2"
] | X-RAY DIFFRACTION | 2.2 | 2026-06-17 | 0.978022 | 1 | core | seq_cfa6024209130a23601f5d2d | struct_1aaf3c4c36263840 | component_3f8b289bd5ed90ed | train | 4 | 10ai_A |
10ai_A | 10ai | A | A | 1 | SNAGGSSPITGLVYDQRMMLHHNMWDSHHPELPQRISRIFSRHEELRLLSRCHRIPARLATEEELALCHSSKHISIIKSSEHMKPRDLNRLGDEYDSIFISNESYTCALLAAGSCFNSAQAILTGQVRNAVAIVRPPGHHAEKDTACGFCFFNTAALTARYAQSITRESLRVLIVDWDVHHGNGTQHIFEEDDSVLYISLHRYEDGAFFPNSEDANYDKVGLGKGRGYNVNIPWNGGKMGDPEYMAAFHHLVMPIAREFAPELVLVSAGFDAARGDPLGGFQVTPEGYAHLTHQLMSLAAGRVLIILEGGYNLTSISESM... | seq_be307890dd23905f77cdfafa | [
"1"
] | X-RAY DIFFRACTION | 2.1 | 2026-06-17 | 0.978022 | 1 | core | seq_cfa6024209130a23601f5d2d | struct_1aaf3c4c36263840 | component_3f8b289bd5ed90ed | train | 4 | 10ai_A |
10ai_B | 10ai | B | B | 1 | SNAGGSSPITGLVYDQRMMLHHNMWDSHHPELPQRISRIFSRHEELRLLSRCHRIPARLATEEELALCHSSKHISIIKSSEHMKPRDLNRLGDEYDSIFISNESYTCALLAAGSCFNSAQAILTGQVRNAVAIVRPPGHHAEKDTACGFCFFNTAALTARYAQSITRESLRVLIVDWDVHHGNGTQHIFEEDDSVLYISLHRYEDGAFFPNSEDANYDKVGLGKGRGYNVNIPWNGGKMGDPEYMAAFHHLVMPIAREFAPELVLVSAGFDAARGDPLGGFQVTPEGYAHLTHQLMSLAAGRVLIILEGGYNLTSISESM... | seq_be307890dd23905f77cdfafa | [
"2"
] | X-RAY DIFFRACTION | 2.1 | 2026-06-17 | 0.978022 | 1 | core | seq_cfa6024209130a23601f5d2d | struct_1aaf3c4c36263840 | component_3f8b289bd5ed90ed | train | 4 | 10ai_A |
10aj_A | 10aj | A | A | 1 | EGEEDDDKDFLWPAPNEEQVTCLKMYFGHSSFKPVQWKVIHSVLEERRDNVAVMATGYGKSLCFQYPPVYVGKIGLVISPLISLMEDQVLQLKMSNIPACFLGSAQSENVLTDIKLGKYRIVYVTPEYCSGNMGLLQQLEADIGITLIAVDEAHCISEWGHDFRDSFRKLGSLKTALPMVPIVALTATASSSIREDIVRCLNLRNPQITCTGFDRPNLYLEVRRKTGNILQDLQPFLVKTSSHWEFEGPTIIYCPSRKMTQQVTGELRKLNLSCGTYHAGMSFSTRKDIHHRFVRDEIQCVIATIAFGMGINKADIRQVI... | seq_969b6ab0389096c0ca7d14c4 | [
"1"
] | X-RAY DIFFRACTION | 2.42 | 2026-05-13 | 0.981352 | 1 | core | seq_6b5dc3d2f02938658e1ad124 | struct_7c2bc6b12135584b | component_3f8b289bd5ed90ed | train | 1 | 10aj_A |
10ak_A | 10ak | A | A | 1 | ANEGEEDDDKDFLWPAPNEEQVTCLKMYFGHSSFKPVQWKVIHSVLEERRDNVAVMATGYGKSLCFQYPPVYVGKIGLVISPLISLMEDQVLQLKMSNIPACFLGSAQSENVLTDIKLGKYRIVYVTPEYCSGNMGLLQQLEADIGITLIAVDEAHCISEWGHDFRDSFRKLGSLKTALPMVPIVALTATASSSIREDIVRCLNLRNPQITCTGFDRPNLYLEVRRKTGNILQDLQPFLVKTSSHWEFEGPTIIYCPSRKMTQQVTGELRKLNLSCGTYHAGMSFSTRKDIHHRFVRDEIQCVIATIAFGMGINKADIRQ... | seq_e98bb0f99dbe86d18f6abe12 | [
"1"
] | X-RAY DIFFRACTION | 1.368 | 2026-05-13 | 0.981439 | 1 | core | seq_6b5dc3d2f02938658e1ad124 | struct_7c2bc6b12135584b | component_3f8b289bd5ed90ed | train | 1 | 10ak_A |
10ap_A | 10ap | A | A | 1 | NLGLPTKEEEEDDENEANEGEEDDDKDFLWPAPNEEQVTCLKMYFGHSSFKPVQWKVIHSVLEERRDNVAVMATGYGKSLCFQYPPVYVGKIGLVISPLISLMEDQVLQLKMSNIPACFLGSAQSENVLTDIKLGKYRIVYVTPEYCSGNMGLLQQLEADIGITLIAVDEAHCISEWGHDFRDSFRKLGSLKTALPMVPIVALTATASSSIREDIVRCLNLRNPQITCTGFDRPNLYLEVRRKTGNILQDLQPFLVKTSSHWEFEGPTIIYCPSRKMTQQVTGELRKLNLSCGTYHAGMSFSTRKDIHHRFVRDEIQCVI... | seq_25ac36d46f06caa0a785c928 | [
"1"
] | X-RAY DIFFRACTION | 2.58 | 2026-05-13 | 0.941834 | 1 | core | seq_6b5dc3d2f02938658e1ad124 | struct_7c2bc6b12135584b | component_3f8b289bd5ed90ed | train | 1 | 10ap_A |
10ay_A | 10ay | A | A | 1 | GKPPQRSIDKPFRLCVSDVFKDQGSGFCITGKIEAGYIQTGDRLLAMPPNETCTVKGITLHDEPVDWAAAGDHVSLTLVGMDIIKINVGCIFCGPKVPIKACTRFRARILIFNIEIPITKGFPVLLHYQTVSEPAVIKRLISVLNKSTGEVTKKKPKFLTKGQNALVELQTQRPIALELYKDFKELGRFMLRYGGSTIAAGVVTEIKE | seq_caa15a978f7aecfe1173252e | [
"1"
] | ELECTRON MICROSCOPY | 2.9 | 2026-04-22 | 0.480769 | 1 | low_quality | seq_2a3a0c3d94c6dfb72d13aa27 | struct_4b2f87d2128982a9 | component_3f8b289bd5ed90ed | train | 4 | 11mr_A |
10ay_B | 10ay | B | B | 2 | GEAKKPNIINFDTSLPTSHTYLGADMEEFHGRTLHDDDSCQVIPVLPQVMMILIPGQTLPLQLFHPQEVSMVRNLIQKDRTFAVLAYSNVQEREAQFGTTAEIYAYREEQDFGIEIVKVKAIGRQRFKVLELRTQSDGIQQAKVQILPECVLPSTMSAVQLESLNKCQIFPSKPVSREDQCSYKWWQKYQKRKFHCANLTSWPRWLYSLYDAETLMDRIKKQLREWDENLKDDSLPSNPIDFSYRVAACLPIDDVLRIQLLKIGSAIQRLRCELDIMNKCTSLCCKQCQETEITTKNEIFSLSLCGPMAAYVNPHGYVHE... | seq_37b13dc80e4e5a333356c5b3 | [
"1"
] | ELECTRON MICROSCOPY | 2.9 | 2026-04-22 | 0.943069 | 1 | core | seq_c3f3cae45b879e67d691f7f2 | struct_0662d7fab350333a | component_3f8b289bd5ed90ed | train | 4 | 11mr_B |
10ay_C | 10ay | C | C | 3 | MSYNYVVTAQKPTAVNGCVTGHFTSAEDLNLLIAKNTRLEIYVVTAEGLRPVKEVGMYGKIAVMELFRPKGESKDLLFILTAKYNACILEYKQSGESIDIITRAHGNVQDRIGRPSETGIIGIIDPECRMIGLRLYDGLFKVIPLDRDNKELKAFNIRLEELHVIDVKFLYGCQAPTICFVYQDPQGRHVKTYEVSLREKEFNKGPWKQENVEAEASMVIAVPEPFGGAIIIGQESITYHNGDKYLAIAPPIIKQSTIVCHNRVDPNGSRYLLGDMEGRLFMLLLEKEEQMDGTVTLKDLRVELLGETSIAECLTYLDNG... | seq_80be356aef4f71329822694d | [
"1"
] | ELECTRON MICROSCOPY | 2.9 | 2026-04-22 | 0.687719 | 1 | extended | seq_0b1744cbd74dc2a14a5c400a | struct_a8a537e9c54fb73b | component_3f8b289bd5ed90ed | train | 75 | 3e0c_A |
10ay_D | 10ay | D | D | 1 | GKPPQRSIDKPFRLCVSDVFKDQGSGFCITGKIEAGYIQTGDRLLAMPPNETCTVKGITLHDEPVDWAAAGDHVSLTLVGMDIIKINVGCIFCGPKVPIKACTRFRARILIFNIEIPITKGFPVLLHYQTVSEPAVIKRLISVLNKSTGEVTKKKPKFLTKGQNALVELQTQRPIALELYKDFKELGRFMLRYGGSTIAAGVVTEIKE | seq_caa15a978f7aecfe1173252e | [
"1"
] | ELECTRON MICROSCOPY | 2.9 | 2026-04-22 | 0.461538 | 1 | low_quality | seq_2a3a0c3d94c6dfb72d13aa27 | struct_4b2f87d2128982a9 | component_3f8b289bd5ed90ed | train | 4 | 11mr_A |
10ay_E | 10ay | E | E | 2 | GEAKKPNIINFDTSLPTSHTYLGADMEEFHGRTLHDDDSCQVIPVLPQVMMILIPGQTLPLQLFHPQEVSMVRNLIQKDRTFAVLAYSNVQEREAQFGTTAEIYAYREEQDFGIEIVKVKAIGRQRFKVLELRTQSDGIQQAKVQILPECVLPSTMSAVQLESLNKCQIFPSKPVSREDQCSYKWWQKYQKRKFHCANLTSWPRWLYSLYDAETLMDRIKKQLREWDENLKDDSLPSNPIDFSYRVAACLPIDDVLRIQLLKIGSAIQRLRCELDIMNKCTSLCCKQCQETEITTKNEIFSLSLCGPMAAYVNPHGYVHE... | seq_37b13dc80e4e5a333356c5b3 | [
"1"
] | ELECTRON MICROSCOPY | 2.9 | 2026-04-22 | 0.943069 | 1 | core | seq_c3f3cae45b879e67d691f7f2 | struct_0662d7fab350333a | component_3f8b289bd5ed90ed | train | 4 | 11mr_B |
10ay_F | 10ay | F | F | 3 | MSYNYVVTAQKPTAVNGCVTGHFTSAEDLNLLIAKNTRLEIYVVTAEGLRPVKEVGMYGKIAVMELFRPKGESKDLLFILTAKYNACILEYKQSGESIDIITRAHGNVQDRIGRPSETGIIGIIDPECRMIGLRLYDGLFKVIPLDRDNKELKAFNIRLEELHVIDVKFLYGCQAPTICFVYQDPQGRHVKTYEVSLREKEFNKGPWKQENVEAEASMVIAVPEPFGGAIIIGQESITYHNGDKYLAIAPPIIKQSTIVCHNRVDPNGSRYLLGDMEGRLFMLLLEKEEQMDGTVTLKDLRVELLGETSIAECLTYLDNG... | seq_80be356aef4f71329822694d | [
"1"
] | ELECTRON MICROSCOPY | 2.9 | 2026-04-22 | 0.685965 | 1 | extended | seq_0b1744cbd74dc2a14a5c400a | struct_a8a537e9c54fb73b | component_3f8b289bd5ed90ed | train | 75 | 3e0c_A |
10be_C | 10be | C | A | 3 | GAMGSMDYKDDDDKMYSGAGPALAPPAPPPPIQGYAFKPPPRPDFGTSGRTIKLQANFFEMDIPKIDIYHYELDIKPEKCPRRVNREIVEHMVQHFKTQIFGDRKPVFDGRKNLYTAMPLPIGRDKVELEVTLPGEGKDRIFKVSIKWVSCVSLQALHDALSGRLPSVPFETIQALDVVMRHLPSMRYTPVGRSFFTASEGCSNPLGGGREVWFGFHQSVRPSLWKMMLNIDVSATAFYKAQPVIEFVCEVLDFKSIEEQQKPLTDSQRVKFTKEIKGLKVEITHCGQMKRKYRVCNVTRRPASHQTFPLQQESGQTVEC... | seq_96fd5a59357343cf7a22afc0 | [
"1"
] | ELECTRON MICROSCOPY | 3.02 | 2026-06-03 | 0.907216 | 1 | core | seq_4bd5ef67c7a40efa13266d24 | struct_fb89371558e09729 | component_3f8b289bd5ed90ed | train | 1 | 10be_C |
10bl_A | 10bl | A | A | 1 | MEKVTKDDFESLDVLGKGSFAYVVLVRRIGTNEYYAMKVVNKQGLLDHNRYRDVFVERNVLSRINHPYLLKLYWTFQSEHKLFFVMEYMPGGDLDKYMNNLPSKQFDLFTAKLYAAEILLALLFLHEHSVIYRDLKPENILLTGDGHCVLADFGLSKDFYNPKEGGDASTKDMRANSFVGSPFYVAPDVLKQSEYTNAVDFWSFGILLYRMLCGRTPFNGKSMREVFDNILYSDLRFPSSVQLPSEAKDLISRLLIKDANRRIKGPEIKAHLFWTGINFDEVMERKVKPPKWVPIPSPEQVMAERAKAEGASTSAKNPGQ... | seq_ce9fe9a75ebf0fd5af718434 | [
"1"
] | X-RAY DIFFRACTION | 2.6 | 2026-01-21 | 0.925208 | 1 | core | seq_c2e80c6e24279dcc21792c38 | struct_bbe510513bfc4bc5 | component_3f8b289bd5ed90ed | train | 10 | 10bl_A |
10bl_B | 10bl | B | B | 1 | MEKVTKDDFESLDVLGKGSFAYVVLVRRIGTNEYYAMKVVNKQGLLDHNRYRDVFVERNVLSRINHPYLLKLYWTFQSEHKLFFVMEYMPGGDLDKYMNNLPSKQFDLFTAKLYAAEILLALLFLHEHSVIYRDLKPENILLTGDGHCVLADFGLSKDFYNPKEGGDASTKDMRANSFVGSPFYVAPDVLKQSEYTNAVDFWSFGILLYRMLCGRTPFNGKSMREVFDNILYSDLRFPSSVQLPSEAKDLISRLLIKDANRRIKGPEIKAHLFWTGINFDEVMERKVKPPKWVPIPSPEQVMAERAKAEGASTSAKNPGQ... | seq_ce9fe9a75ebf0fd5af718434 | [
"1"
] | X-RAY DIFFRACTION | 2.6 | 2026-01-21 | 0.894737 | 1 | core | seq_c2e80c6e24279dcc21792c38 | struct_bbe510513bfc4bc5 | component_3f8b289bd5ed90ed | train | 10 | 10bl_A |
10bm_A | 10bm | A | A | 1 | MAHHHHHHSPILPGAWLGMVGGGQLGRMFCFAAQAMGYRVAVLDPDENSPAGAVADRHLRAAYNDEASLTELARLCAAVSTEFENVPAASLDFLARTTFVSPAGRCVAVAQDRIAEKRFIASSGVTVAPHVVIESSDALAALDDAKLEAVLPGILKTARMGYDGKGQIRVRNAEEVREAHASLAGVPCVLEKRLPLKFEVSALIARAASGASVVYPLAQNTHRDGVLSHTIVPAPDASPTLVQQAQQAALQIADKLGYVGVLCVEFFILEDGSLVANEMAPRPHNSGHYTVDACATSQFEQQVRAMTGMPLGDTRQHSPA... | seq_cddf9cb4fec978452f2d8fd7 | [
"1"
] | X-RAY DIFFRACTION | 2.49 | 2026-01-21 | 0.97733 | 1 | core | seq_3bcb3f500f24a67384287a21 | struct_f42856f5e6985860 | component_3f8b289bd5ed90ed | train | 18 | 9zoi_A |
10bm_B | 10bm | B | B | 1 | MAHHHHHHSPILPGAWLGMVGGGQLGRMFCFAAQAMGYRVAVLDPDENSPAGAVADRHLRAAYNDEASLTELARLCAAVSTEFENVPAASLDFLARTTFVSPAGRCVAVAQDRIAEKRFIASSGVTVAPHVVIESSDALAALDDAKLEAVLPGILKTARMGYDGKGQIRVRNAEEVREAHASLAGVPCVLEKRLPLKFEVSALIARAASGASVVYPLAQNTHRDGVLSHTIVPAPDASPTLVQQAQQAALQIADKLGYVGVLCVEFFILEDGSLVANEMAPRPHNSGHYTVDACATSQFEQQVRAMTGMPLGDTRQHSPA... | seq_cddf9cb4fec978452f2d8fd7 | [
"2"
] | X-RAY DIFFRACTION | 2.49 | 2026-01-21 | 0.964736 | 1 | core | seq_3bcb3f500f24a67384287a21 | struct_f42856f5e6985860 | component_3f8b289bd5ed90ed | train | 18 | 9zoi_A |
10bm_C | 10bm | C | C | 1 | MAHHHHHHSPILPGAWLGMVGGGQLGRMFCFAAQAMGYRVAVLDPDENSPAGAVADRHLRAAYNDEASLTELARLCAAVSTEFENVPAASLDFLARTTFVSPAGRCVAVAQDRIAEKRFIASSGVTVAPHVVIESSDALAALDDAKLEAVLPGILKTARMGYDGKGQIRVRNAEEVREAHASLAGVPCVLEKRLPLKFEVSALIARAASGASVVYPLAQNTHRDGVLSHTIVPAPDASPTLVQQAQQAALQIADKLGYVGVLCVEFFILEDGSLVANEMAPRPHNSGHYTVDACATSQFEQQVRAMTGMPLGDTRQHSPA... | seq_cddf9cb4fec978452f2d8fd7 | [
"3"
] | X-RAY DIFFRACTION | 2.49 | 2026-01-21 | 0.979849 | 1 | core | seq_3bcb3f500f24a67384287a21 | struct_f42856f5e6985860 | component_3f8b289bd5ed90ed | train | 18 | 9zoi_A |
10bm_D | 10bm | D | D | 1 | MAHHHHHHSPILPGAWLGMVGGGQLGRMFCFAAQAMGYRVAVLDPDENSPAGAVADRHLRAAYNDEASLTELARLCAAVSTEFENVPAASLDFLARTTFVSPAGRCVAVAQDRIAEKRFIASSGVTVAPHVVIESSDALAALDDAKLEAVLPGILKTARMGYDGKGQIRVRNAEEVREAHASLAGVPCVLEKRLPLKFEVSALIARAASGASVVYPLAQNTHRDGVLSHTIVPAPDASPTLVQQAQQAALQIADKLGYVGVLCVEFFILEDGSLVANEMAPRPHNSGHYTVDACATSQFEQQVRAMTGMPLGDTRQHSPA... | seq_cddf9cb4fec978452f2d8fd7 | [
"4"
] | X-RAY DIFFRACTION | 2.49 | 2026-01-21 | 0.967254 | 1 | core | seq_3bcb3f500f24a67384287a21 | struct_f42856f5e6985860 | component_3f8b289bd5ed90ed | train | 18 | 9zoi_A |
10br_A | 10br | A | A | 1 | GPLGSIESAWLGISFYPLKTRDSEVLKSLGVESNDVSAAIIASLYPGSPAVKSGLRAGDIIMKVNGVSMSVFQDVTSYISDFYAGEKVNVEILRGNVKKNIEIVLAVRPKDKELSSSKMLPGFVVYPLVEDIKAQLNLRNWIKGVVVDYIDKNLASNIKMKSGDVILSVNSKSVSNLREFYDALEVGKNTYKILRGNDSFKITF | seq_86769b4f7e15dccaa1580cc4 | [
"1"
] | X-RAY DIFFRACTION | 1.5 | 2026-06-17 | 1 | 1 | core | seq_86769b4f7e15dccaa1580cc4 | struct_905e0881dd84d01e | component_56c9ada516b64618 | train | 4 | 10br_A |
10br_B | 10br | B | B | 1 | GPLGSIESAWLGISFYPLKTRDSEVLKSLGVESNDVSAAIIASLYPGSPAVKSGLRAGDIIMKVNGVSMSVFQDVTSYISDFYAGEKVNVEILRGNVKKNIEIVLAVRPKDKELSSSKMLPGFVVYPLVEDIKAQLNLRNWIKGVVVDYIDKNLASNIKMKSGDVILSVNSKSVSNLREFYDALEVGKNTYKILRGNDSFKITF | seq_86769b4f7e15dccaa1580cc4 | [
"1"
] | X-RAY DIFFRACTION | 1.5 | 2026-06-17 | 0.97549 | 1 | core | seq_86769b4f7e15dccaa1580cc4 | struct_905e0881dd84d01e | component_56c9ada516b64618 | train | 4 | 10br_A |
10br_C | 10br | C | C | 1 | GPLGSIESAWLGISFYPLKTRDSEVLKSLGVESNDVSAAIIASLYPGSPAVKSGLRAGDIIMKVNGVSMSVFQDVTSYISDFYAGEKVNVEILRGNVKKNIEIVLAVRPKDKELSSSKMLPGFVVYPLVEDIKAQLNLRNWIKGVVVDYIDKNLASNIKMKSGDVILSVNSKSVSNLREFYDALEVGKNTYKILRGNDSFKITF | seq_86769b4f7e15dccaa1580cc4 | [
"2"
] | X-RAY DIFFRACTION | 1.5 | 2026-06-17 | 0.97549 | 1 | core | seq_86769b4f7e15dccaa1580cc4 | struct_905e0881dd84d01e | component_56c9ada516b64618 | train | 4 | 10br_A |
10br_D | 10br | D | D | 1 | GPLGSIESAWLGISFYPLKTRDSEVLKSLGVESNDVSAAIIASLYPGSPAVKSGLRAGDIIMKVNGVSMSVFQDVTSYISDFYAGEKVNVEILRGNVKKNIEIVLAVRPKDKELSSSKMLPGFVVYPLVEDIKAQLNLRNWIKGVVVDYIDKNLASNIKMKSGDVILSVNSKSVSNLREFYDALEVGKNTYKILRGNDSFKITF | seq_86769b4f7e15dccaa1580cc4 | [
"2"
] | X-RAY DIFFRACTION | 1.5 | 2026-06-17 | 1 | 1 | core | seq_86769b4f7e15dccaa1580cc4 | struct_905e0881dd84d01e | component_56c9ada516b64618 | train | 4 | 10br_A |
10bt_A | 10bt | A | A | 1 | EVKLEESGGGLVQPGGSMRLSCVASGFTFSNYWMNWVRQSPEKGLEWVAEIRLKSNNYATHYAESVKGRFTISRDDSTSSGYLQMNNLRTEDTGIHYCTLTLITDYDVMEYWGQGTSVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSCDKTHHHHHH | seq_52a0661b7733bda7e68395ad | [
"1"
] | X-RAY DIFFRACTION | 1.99 | 2026-06-10 | 0.952991 | 1 | core | seq_18e826e63cb5b287c0599278 | struct_277beb1d82fc6a91 | component_3f8b289bd5ed90ed | train | 4 | 10bt_A |
10bt_B | 10bt | B | B | 1 | EVKLEESGGGLVQPGGSMRLSCVASGFTFSNYWMNWVRQSPEKGLEWVAEIRLKSNNYATHYAESVKGRFTISRDDSTSSGYLQMNNLRTEDTGIHYCTLTLITDYDVMEYWGQGTSVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSCDKTHHHHHH | seq_52a0661b7733bda7e68395ad | [
"2"
] | X-RAY DIFFRACTION | 1.99 | 2026-06-10 | 0.940171 | 1 | core | seq_18e826e63cb5b287c0599278 | struct_f1cc39e7021627f2 | component_3f8b289bd5ed90ed | train | 4 | 10bt_A |
10bt_C | 10bt | C | C | 1 | EVKLEESGGGLVQPGGSMRLSCVASGFTFSNYWMNWVRQSPEKGLEWVAEIRLKSNNYATHYAESVKGRFTISRDDSTSSGYLQMNNLRTEDTGIHYCTLTLITDYDVMEYWGQGTSVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSCDKTHHHHHH | seq_52a0661b7733bda7e68395ad | [
"3"
] | X-RAY DIFFRACTION | 1.99 | 2026-06-10 | 0.91453 | 1 | core | seq_18e826e63cb5b287c0599278 | struct_277beb1d82fc6a91 | component_3f8b289bd5ed90ed | train | 4 | 10bt_A |
10bt_D | 10bt | D | D | 1 | EVKLEESGGGLVQPGGSMRLSCVASGFTFSNYWMNWVRQSPEKGLEWVAEIRLKSNNYATHYAESVKGRFTISRDDSTSSGYLQMNNLRTEDTGIHYCTLTLITDYDVMEYWGQGTSVTVSSASTKGPSVFPLAPSSKSTSGGTAALGCLVKDYFPEPVTVSWNSGALTSGVHTFPAVLQSSGLYSLSSVVTVPSSSLGTQTYICNVNHKPSNTKVDKKVEPKSCDKTHHHHHH | seq_52a0661b7733bda7e68395ad | [
"4"
] | X-RAY DIFFRACTION | 1.99 | 2026-06-10 | 0.940171 | 1 | core | seq_18e826e63cb5b287c0599278 | struct_277beb1d82fc6a91 | component_3f8b289bd5ed90ed | train | 4 | 10bt_A |
10bt_E | 10bt | E | E | 2 | DIQMTQSPSSLSASLGGKVTITCKANQDINKYIAWYQHKPGQGPRLLIHYASALQPGIPSRFSGSGSGRDYSFSISNLEPEDIATYYCLQYDNLYTFGGGTKLEIKRARTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC | seq_157d00c820376fd723c3d257 | [
"1"
] | X-RAY DIFFRACTION | 1.99 | 2026-06-10 | 1 | 1 | core | seq_67bd7e2cba6e8d057f61d4fb | struct_69c04d1a82b73f90 | component_3f8b289bd5ed90ed | train | 4 | 10bt_E |
10bt_F | 10bt | F | F | 2 | DIQMTQSPSSLSASLGGKVTITCKANQDINKYIAWYQHKPGQGPRLLIHYASALQPGIPSRFSGSGSGRDYSFSISNLEPEDIATYYCLQYDNLYTFGGGTKLEIKRARTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC | seq_157d00c820376fd723c3d257 | [
"2"
] | X-RAY DIFFRACTION | 1.99 | 2026-06-10 | 1 | 1 | core | seq_67bd7e2cba6e8d057f61d4fb | struct_69c04d1a82b73f90 | component_3f8b289bd5ed90ed | train | 4 | 10bt_E |
10bt_G | 10bt | G | G | 2 | DIQMTQSPSSLSASLGGKVTITCKANQDINKYIAWYQHKPGQGPRLLIHYASALQPGIPSRFSGSGSGRDYSFSISNLEPEDIATYYCLQYDNLYTFGGGTKLEIKRARTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC | seq_157d00c820376fd723c3d257 | [
"3"
] | X-RAY DIFFRACTION | 1.99 | 2026-06-10 | 1 | 1 | core | seq_67bd7e2cba6e8d057f61d4fb | struct_69c04d1a82b73f90 | component_3f8b289bd5ed90ed | train | 4 | 10bt_E |
10bt_H | 10bt | H | H | 2 | DIQMTQSPSSLSASLGGKVTITCKANQDINKYIAWYQHKPGQGPRLLIHYASALQPGIPSRFSGSGSGRDYSFSISNLEPEDIATYYCLQYDNLYTFGGGTKLEIKRARTVAAPSVFIFPPSDEQLKSGTASVVCLLNNFYPREAKVQWKVDNALQSGNSQESVTEQDSKDSTYSLSSTLTLSKADYEKHKVYACEVTHQGLSSPVTKSFNRGEC | seq_157d00c820376fd723c3d257 | [
"4"
] | X-RAY DIFFRACTION | 1.99 | 2026-06-10 | 1 | 1 | core | seq_67bd7e2cba6e8d057f61d4fb | struct_69c04d1a82b73f90 | component_3f8b289bd5ed90ed | train | 4 | 10bt_E |
10bu_A | 10bu | A | A | 1 | MMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSTGEIPAPLAGTVSKILVKEGDTVKAGQTVLVLEAMKMETEINAPTDGKVEKVLVKERDAVQGGQGLIKIGGGTP... | seq_9f36cbab56bf103bcb6f152d | [
"1"
] | ELECTRON MICROSCOPY | 3.2 | 2026-05-27 | 0.998991 | 1 | core | seq_b360e235ec9237254a4dc51a | struct_f23e1e64a56e6400 | component_3f8b289bd5ed90ed | train | 3 | 10bu_A |
10bu_B | 10bu | B | B | 1 | MMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSTGEIPAPLAGTVSKILVKEGDTVKAGQTVLVLEAMKMETEINAPTDGKVEKVLVKERDAVQGGQGLIKIGGGTP... | seq_9f36cbab56bf103bcb6f152d | [
"1"
] | ELECTRON MICROSCOPY | 3.2 | 2026-05-27 | 0.998991 | 1 | core | seq_b360e235ec9237254a4dc51a | struct_f23e1e64a56e6400 | component_3f8b289bd5ed90ed | train | 3 | 10bu_A |
10bu_C | 10bu | C | C | 1 | MMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSTGEIPAPLAGTVSKILVKEGDTVKAGQTVLVLEAMKMETEINAPTDGKVEKVLVKERDAVQGGQGLIKIGGGTP... | seq_9f36cbab56bf103bcb6f152d | [
"1"
] | ELECTRON MICROSCOPY | 3.2 | 2026-05-27 | 0.995964 | 1 | core | seq_b360e235ec9237254a4dc51a | struct_f23e1e64a56e6400 | component_3f8b289bd5ed90ed | train | 3 | 10bu_A |
30bt_A | 30bt | A | A | 1 | MIAAPLVRVTLAYICGLLLASRITVGPVQLLALTVILWTLAYLFRQPPRRAAWQAFLLAGFMALGLLISTWDSSHHQSRLTGDRGTFLDLSGTVIEEPRVYANRVVYTLATREIRQGDYHKRVKEKVQVVLYRPAEGGEPELYRYGDVLRVHGQLAAPPAARNPGELDYRAYLARQYIYNRMLINDPRAIVKLGTVPGHPLVRLALGAKARVKTVITAALPPRQAGILAALLFGDVNELTDTDSDTFKNLGVFHFFAVSGSNTALVLLILMAIAGFLGLERSGAVFLGLAGLIFYAAVTGFTPSVSRAGIMAGLGLIAYL... | seq_52af76c97b47f395dd15cf86 | [
"1"
] | ELECTRON MICROSCOPY | 4.2 | 2026-05-20 | 0.340824 | 1 | low_quality | seq_52af76c97b47f395dd15cf86 | struct_5f54bba25646e9a1 | component_3f8b289bd5ed90ed | train | 3 | 30bu_A |
30bu_A | 30bu | A | A | 1 | MIAAPLVRVTLAYICGLLLASRITVGPVQLLALTVILWTLAYLFRQPPRRAAWQAFLLAGFMALGLLISTWDSSHHQSRLTGDRGTFLDLSGTVIEEPRVYANRVVYTLATREIRQGDYHKRVKEKVQVVLYRPAEGGEPELYRYGDVLRVHGQLAAPPAARNPGELDYRAYLARQYIYNRMLINDPRAIVKLGTVPGHPLVRLALGAKARVKTVITAALPPRQAGILAALLFGDVNELTDTDSDTFKNLGVFHFFAVSGSNTALVLLILMAIAGFLGLERSGAVFLGLAGLIFYAAVTGFTPSVSRAGIMAGLGLIAYL... | seq_52af76c97b47f395dd15cf86 | [
"1"
] | ELECTRON MICROSCOPY | 4.1 | 2026-05-20 | 0.659176 | 1 | extended | seq_52af76c97b47f395dd15cf86 | struct_83ec445fdf12ee88 | component_3f8b289bd5ed90ed | train | 3 | 30bu_A |
30bu_B | 30bu | B | B | 1 | MIAAPLVRVTLAYICGLLLASRITVGPVQLLALTVILWTLAYLFRQPPRRAAWQAFLLAGFMALGLLISTWDSSHHQSRLTGDRGTFLDLSGTVIEEPRVYANRVVYTLATREIRQGDYHKRVKEKVQVVLYRPAEGGEPELYRYGDVLRVHGQLAAPPAARNPGELDYRAYLARQYIYNRMLINDPRAIVKLGTVPGHPLVRLALGAKARVKTVITAALPPRQAGILAALLFGDVNELTDTDSDTFKNLGVFHFFAVSGSNTALVLLILMAIAGFLGLERSGAVFLGLAGLIFYAAVTGFTPSVSRAGIMAGLGLIAYL... | seq_52af76c97b47f395dd15cf86 | [
"1"
] | ELECTRON MICROSCOPY | 4.1 | 2026-05-20 | 0.619226 | 1 | extended | seq_52af76c97b47f395dd15cf86 | struct_83ec445fdf12ee88 | component_3f8b289bd5ed90ed | train | 3 | 30bu_A |
10dc_A | 10dc | A | A | 1 | MTEYKLVVVGAGGVGKSALTIQLIQNHFVDEYDPTIEDSYRKQVVIDGETCLLDILDTAGQEEYSAMADQYMRTGEGFLCVFAINNTKSFEDIHQYREQIKRVKDSDDVPMVLVGNKCDLAARTVESRQAQDLARSYGIPYIETSAKTRQGVEDAFYTLVREIRQH | seq_04fdee737523926977ff5491 | [
"1"
] | X-RAY DIFFRACTION | 2.08 | 2026-02-11 | 0.975904 | 1 | core | seq_747ca141edd1a6d25946ca51 | struct_04fe40d84ea9653a | component_3f8b289bd5ed90ed | train | 1 | 10dc_A |
10dj_A | 10dj | A | A | 1 | VWEIPRESLQLIKRLGNGQFGEVWMGTWNGNTKVAIKTLKPGTMSPESFLEEAQIMKKLKHDKLVQLYAVVSEEPIYIVTEYMNKGSLLDFLKDGEGRALKLPNLVDMAAQVAAGMAYIERMNYIHRDLRSANILVGNGLICKIADFGLARLIEDNEYTARQGAKFPIKWTAPEAALYGRFTIKSDVWSFGILLTELVTKGRVPYPGMNNREVLEQVERGYRMPCPQDCPISLHELMIHCWKKDPEERPTFEYLQSFLEDYFTATEPQYQPGENLVDENLYF | seq_925babf455e1a2da5207ed61 | [
"1"
] | X-RAY DIFFRACTION | 2.22 | 2026-03-18 | 0.953901 | 1 | core | seq_49d757fa60ff99b0d2bc2a03 | struct_d38926c0a86ec433 | component_3f8b289bd5ed90ed | train | 2 | 10dj_B |
10dj_B | 10dj | B | B | 1 | VWEIPRESLQLIKRLGNGQFGEVWMGTWNGNTKVAIKTLKPGTMSPESFLEEAQIMKKLKHDKLVQLYAVVSEEPIYIVTEYMNKGSLLDFLKDGEGRALKLPNLVDMAAQVAAGMAYIERMNYIHRDLRSANILVGNGLICKIADFGLARLIEDNEYTARQGAKFPIKWTAPEAALYGRFTIKSDVWSFGILLTELVTKGRVPYPGMNNREVLEQVERGYRMPCPQDCPISLHELMIHCWKKDPEERPTFEYLQSFLEDYFTATEPQYQPGENLVDENLYF | seq_925babf455e1a2da5207ed61 | [
"2"
] | X-RAY DIFFRACTION | 2.22 | 2026-03-18 | 0.98227 | 1 | core | seq_49d757fa60ff99b0d2bc2a03 | struct_d38926c0a86ec433 | component_3f8b289bd5ed90ed | train | 2 | 10dj_B |
10dk_A | 10dk | A | A | 1 | MATPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSSGGTPKLVLYSEDVNMETPDTHLSYKPGKSDDNSKAMLGQQSMPNRPNYIAFRDNFIGLMYYNSTGNMG... | seq_0e2ee9f45935c6263d849e83 | [
"1"
] | ELECTRON MICROSCOPY | 3.22 | 2026-05-27 | 0.9946 | 1 | core | seq_b360e235ec9237254a4dc51a | struct_f23e1e64a56e6400 | component_3f8b289bd5ed90ed | train | 3 | 10dk_B |
10dk_B | 10dk | B | B | 1 | MATPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSSGGTPKLVLYSEDVNMETPDTHLSYKPGKSDDNSKAMLGQQSMPNRPNYIAFRDNFIGLMYYNSTGNMG... | seq_0e2ee9f45935c6263d849e83 | [
"1"
] | ELECTRON MICROSCOPY | 3.22 | 2026-05-27 | 0.99568 | 1 | core | seq_b360e235ec9237254a4dc51a | struct_f23e1e64a56e6400 | component_3f8b289bd5ed90ed | train | 3 | 10dk_B |
10dk_C | 10dk | C | C | 1 | MATPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSSGGTPKLVLYSEDVNMETPDTHLSYKPGKSDDNSKAMLGQQSMPNRPNYIAFRDNFIGLMYYNSTGNMG... | seq_0e2ee9f45935c6263d849e83 | [
"1"
] | ELECTRON MICROSCOPY | 3.22 | 2026-05-27 | 0.9946 | 1 | core | seq_b360e235ec9237254a4dc51a | struct_f23e1e64a56e6400 | component_3f8b289bd5ed90ed | train | 3 | 10dk_B |
10dp_A | 10dp | A | A | 1 | TPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDTQVQVAAEDDQDDDEEEEQLPQQRNGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSVNAMNEANAIQPKLLLYSEDVNMETPDTHLSYKPGKSDDNSKAMLG... | seq_6ec82d74f63c3dbd66c7a119 | [
"1"
] | ELECTRON MICROSCOPY | 3.25 | 2026-05-27 | 0.970711 | 1 | core | seq_b360e235ec9237254a4dc51a | struct_f23e1e64a56e6400 | component_3f8b289bd5ed90ed | train | 3 | 10dp_A |
10dp_B | 10dp | B | B | 1 | TPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDTQVQVAAEDDQDDDEEEEQLPQQRNGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSVNAMNEANAIQPKLLLYSEDVNMETPDTHLSYKPGKSDDNSKAMLG... | seq_6ec82d74f63c3dbd66c7a119 | [
"1"
] | ELECTRON MICROSCOPY | 3.25 | 2026-05-27 | 0.970711 | 1 | core | seq_b360e235ec9237254a4dc51a | struct_f23e1e64a56e6400 | component_3f8b289bd5ed90ed | train | 3 | 10dp_A |
10dp_C | 10dp | C | C | 1 | TPSMMPQWSYMHISGQDASEYLSPGLVQFARATETYFSLNNKFRNPTVAPTHDVTTDRSQRLTLRFIPVDREDTAYSYKARFTLAVGDNRVLDMASTYFDIRGVLDRGPTFKPYSGTAYNALAPKGAPNSCEWDEDDTQVQVAAEDDQDDDEEEEQLPQQRNGKKTHVYAQAPFAGEAINKNGLQIGTNGAATEGNKEIYADKTYQPEPQIGESQWNEAESSVAGGRVLKKTTPMKPCYGSYARPTNSNGGQGVMVEQNGKLESQVEMQFFSTSVNAMNEANAIQPKLLLYSEDVNMETPDTHLSYKPGKSDDNSKAMLG... | seq_6ec82d74f63c3dbd66c7a119 | [
"1"
] | ELECTRON MICROSCOPY | 3.25 | 2026-05-27 | 0.969665 | 1 | core | seq_b360e235ec9237254a4dc51a | struct_f23e1e64a56e6400 | component_3f8b289bd5ed90ed | train | 3 | 10dp_A |
10dv_A | 10dv | A | A | 1 | SGFRKMAFPSGKVEGCMVQVTCGTTTLNGLWLDDVVYCPRHVICTSEDMLNPNYEDLLIRKSNHNFLVQAGNVQLRVIGHSMQNCVLKLKVDTANPKTPKYKFVRIQPGQTFSVLACYNGSPSGVYQCAMRPNFTIKGSFLNGSAGSVGFNIDYDCVSFCYMHHMELPTGVHAGTDLEGNFYGPFVDRQTAQAAGTDTTITVNVLAWLYAAVINGDRWFLNRFTTTLNDFNLVAMKYNYEPLTQDHVDILGPLSAQTGIAVLDMCASLKELLQNGMNGRTILGSALLEDEFTPFDVVRQCSGVTFQSAVMQYKLILNGKT... | seq_3f7754e0a895ca6e7a129a68 | [
"1"
] | X-RAY DIFFRACTION | 2.05 | 2026-05-06 | 0.806971 | 1 | core | seq_2fdfb46ec3991cba6d737539 | struct_b98635064a47290c | component_3f8b289bd5ed90ed | train | 2 | 10dv_A |
10dv_B | 10dv | B | B | 1 | SGFRKMAFPSGKVEGCMVQVTCGTTTLNGLWLDDVVYCPRHVICTSEDMLNPNYEDLLIRKSNHNFLVQAGNVQLRVIGHSMQNCVLKLKVDTANPKTPKYKFVRIQPGQTFSVLACYNGSPSGVYQCAMRPNFTIKGSFLNGSAGSVGFNIDYDCVSFCYMHHMELPTGVHAGTDLEGNFYGPFVDRQTAQAAGTDTTITVNVLAWLYAAVINGDRWFLNRFTTTLNDFNLVAMKYNYEPLTQDHVDILGPLSAQTGIAVLDMCASLKELLQNGMNGRTILGSALLEDEFTPFDVVRQCSGVTFQSAVMQYKLILNGKT... | seq_3f7754e0a895ca6e7a129a68 | [
"1"
] | X-RAY DIFFRACTION | 2.05 | 2026-05-06 | 0.806971 | 1 | core | seq_2fdfb46ec3991cba6d737539 | struct_b98635064a47290c | component_3f8b289bd5ed90ed | train | 2 | 10dv_A |
10en_A | 10en | A | A | 1 | KIVNIGAVLSTRKHEQMFREAVNQANKRHGSWKIQLNATSVTHKPNAIQMALSVCEDLISSQVYAILVSHPPTPNDHFTPTPVSYTAGFYRIPVLGLTTRMSIYSDKSIHLSFLRTVPPYSHQSSVWFEMMRVYSWNHIILLVSDDHEGRAAQKRLETLLEERESKAEKVLQFDPGTKNVTALLMEARELEARVIILSASEDDAATVYRAAAMLNMTGSGYVWLVGEREISGNALRYAPDGIIGLQLINGKNESAHISDAVGVVAQAVHELLEKENITDPPRGCVGNTNIWKTGPLFKRVLMSSKYADGVTGRVEFNEDG... | seq_7255603097ee423fed8b0c34 | [
"1"
] | ELECTRON MICROSCOPY | 3.7 | 2026-03-25 | 0.973072 | 1 | core | seq_0c6927097c6f94558cbe12bb | struct_14d5849aae0a8126 | component_3f8b289bd5ed90ed | train | 6 | 10en_A |
10en_B | 10en | B | B | 2 | FHHLSVVPRVELVAMNETDPKSIITRICDLMSDRKIQGVVFADDTDQEAIAQILDFISAQTLTPILGIHGGSSMIMADKDESSMFFQFGPSIEQQASVMLNIMEEYDWYIFSIVTTYFPGYQDFVNKIRSTIENSFVGWELEEVLLLDMSLDDGDSKIQNQLKKLQSPIILLYCTKEEATYIFEVANSVGLTGYGYTWIVPSLVAGDTDTVPSEFPTGLISVSYDEWDYGLPARVRDGIAIITTAASDMLSEHSFIPEPKSSCYNTHEKRIYQSNMLNRYLINVTFEGRNLSFSEDGYQMHPKLVIILLNKERKWERVGK... | seq_0b21ed8660d006ae3b501226 | [
"1"
] | ELECTRON MICROSCOPY | 3.7 | 2026-03-25 | 0.955527 | 1 | core | seq_c633012c5d9396303f6c3955 | struct_5f99414d7af5f3ac | component_3f8b289bd5ed90ed | train | 6 | 10en_B |
10en_C | 10en | C | C | 1 | KIVNIGAVLSTRKHEQMFREAVNQANKRHGSWKIQLNATSVTHKPNAIQMALSVCEDLISSQVYAILVSHPPTPNDHFTPTPVSYTAGFYRIPVLGLTTRMSIYSDKSIHLSFLRTVPPYSHQSSVWFEMMRVYSWNHIILLVSDDHEGRAAQKRLETLLEERESKAEKVLQFDPGTKNVTALLMEARELEARVIILSASEDDAATVYRAAAMLNMTGSGYVWLVGEREISGNALRYAPDGIIGLQLINGKNESAHISDAVGVVAQAVHELLEKENITDPPRGCVGNTNIWKTGPLFKRVLMSSKYADGVTGRVEFNEDG... | seq_7255603097ee423fed8b0c34 | [
"1"
] | ELECTRON MICROSCOPY | 3.7 | 2026-03-25 | 0.973072 | 1 | core | seq_0c6927097c6f94558cbe12bb | struct_f9d265a2cd2aaab5 | component_3f8b289bd5ed90ed | train | 6 | 10en_A |
10en_D | 10en | D | D | 2 | FHHLSVVPRVELVAMNETDPKSIITRICDLMSDRKIQGVVFADDTDQEAIAQILDFISAQTLTPILGIHGGSSMIMADKDESSMFFQFGPSIEQQASVMLNIMEEYDWYIFSIVTTYFPGYQDFVNKIRSTIENSFVGWELEEVLLLDMSLDDGDSKIQNQLKKLQSPIILLYCTKEEATYIFEVANSVGLTGYGYTWIVPSLVAGDTDTVPSEFPTGLISVSYDEWDYGLPARVRDGIAIITTAASDMLSEHSFIPEPKSSCYNTHEKRIYQSNMLNRYLINVTFEGRNLSFSEDGYQMHPKLVIILLNKERKWERVGK... | seq_0b21ed8660d006ae3b501226 | [
"1"
] | ELECTRON MICROSCOPY | 3.7 | 2026-03-25 | 0.951715 | 1 | core | seq_c633012c5d9396303f6c3955 | struct_5f99414d7af5f3ac | component_3f8b289bd5ed90ed | train | 6 | 10en_B |
10en_E | 10en | E | E | 3 | DIVLTQSPASLAVSLGQRATISCRASKSVSTSGYSYMNWYQQKAGQPPKLLIYLASNLESGVPARFSGSGSGTDFTLNIHPVEEEDAATYYCQHSRELPYTFGGGTKLEIK | seq_2a897060776f2ba361788d64 | [
"1"
] | ELECTRON MICROSCOPY | 3.7 | 2026-03-25 | 1 | 1 | core | seq_392b87a60783b379b79fea27 | struct_05d89e0f8014586e | component_3f8b289bd5ed90ed | train | 2 | 10en_E |
10en_F | 10en | F | F | 4 | EVQLQQSGPELVKPGASVKMSCKASGYTFTSYVMHWVKQKPGQGLEWIGYINPYSDGTNYNEKFKGKATLTSDKSSSTAYMELSSLTSEDSAVYYCARLTTVVEGAMDYWGQGTSVTVSS | seq_8e8866012ad1f1eb43f44e6d | [
"1"
] | ELECTRON MICROSCOPY | 3.7 | 2026-03-25 | 1 | 1 | core | seq_12249a9611cfdc161bfe7e1c | struct_e1bd67264b90f9fa | component_3f8b289bd5ed90ed | train | 2 | 10en_F |
10en_G | 10en | G | I | 3 | DIVLTQSPASLAVSLGQRATISCRASKSVSTSGYSYMNWYQQKAGQPPKLLIYLASNLESGVPARFSGSGSGTDFTLNIHPVEEEDAATYYCQHSRELPYTFGGGTKLEIK | seq_2a897060776f2ba361788d64 | [
"1"
] | ELECTRON MICROSCOPY | 3.7 | 2026-03-25 | 1 | 1 | core | seq_392b87a60783b379b79fea27 | struct_05d89e0f8014586e | component_3f8b289bd5ed90ed | train | 2 | 10en_E |
10en_H | 10en | H | J | 4 | EVQLQQSGPELVKPGASVKMSCKASGYTFTSYVMHWVKQKPGQGLEWIGYINPYSDGTNYNEKFKGKATLTSDKSSSTAYMELSSLTSEDSAVYYCARLTTVVEGAMDYWGQGTSVTVSS | seq_8e8866012ad1f1eb43f44e6d | [
"1"
] | ELECTRON MICROSCOPY | 3.7 | 2026-03-25 | 1 | 1 | core | seq_12249a9611cfdc161bfe7e1c | struct_c062861de08ab299 | component_3f8b289bd5ed90ed | train | 2 | 10en_F |
10eo_A | 10eo | A | A | 1 | ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV... | seq_d61026e47f4265b59f0b86a6 | [
"1"
] | ELECTRON MICROSCOPY | 3.2 | 2026-05-27 | 0.889746 | 1 | core | seq_bb3a0a9b067359c4dba1d607 | struct_f388146ed7cea03a | component_3f8b289bd5ed90ed | train | 6 | 10eo_A |
10eo_B | 10eo | B | B | 1 | ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV... | seq_d61026e47f4265b59f0b86a6 | [
"1"
] | ELECTRON MICROSCOPY | 3.2 | 2026-05-27 | 0.889746 | 1 | core | seq_bb3a0a9b067359c4dba1d607 | struct_f388146ed7cea03a | component_3f8b289bd5ed90ed | train | 6 | 10eo_A |
10ep_A | 10ep | A | B | 1 | ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV... | seq_d61026e47f4265b59f0b86a6 | [
"1"
] | ELECTRON MICROSCOPY | 3.2 | 2026-05-27 | 0.889746 | 1 | core | seq_bb3a0a9b067359c4dba1d607 | struct_f388146ed7cea03a | component_3f8b289bd5ed90ed | train | 6 | 10eo_A |
10ep_B | 10ep | B | A | 1 | ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV... | seq_d61026e47f4265b59f0b86a6 | [
"1"
] | ELECTRON MICROSCOPY | 3.2 | 2026-05-27 | 0.878721 | 1 | core | seq_bb3a0a9b067359c4dba1d607 | struct_f388146ed7cea03a | component_3f8b289bd5ed90ed | train | 6 | 10eo_A |
10eq_A | 10eq | A | A | 1 | HHHHHHGGASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVP... | seq_ecae2105c114f891ff4a7502 | [
"1"
] | ELECTRON MICROSCOPY | 3.3 | 2026-05-27 | 0.679162 | 1 | extended | seq_bb3a0a9b067359c4dba1d607 | struct_f388146ed7cea03a | component_3f8b289bd5ed90ed | train | 4 | 10es_A |
10eq_B | 10eq | B | B | 1 | HHHHHHGGASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVP... | seq_ecae2105c114f891ff4a7502 | [
"1"
] | ELECTRON MICROSCOPY | 3.3 | 2026-05-27 | 0.888644 | 1 | core | seq_bb3a0a9b067359c4dba1d607 | struct_f388146ed7cea03a | component_3f8b289bd5ed90ed | train | 4 | 10es_A |
10er_A | 10er | A | B | 1 | ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV... | seq_d61026e47f4265b59f0b86a6 | [
"1"
] | ELECTRON MICROSCOPY | 3.2 | 2026-05-27 | 0.878721 | 1 | core | seq_bb3a0a9b067359c4dba1d607 | struct_f388146ed7cea03a | component_3f8b289bd5ed90ed | train | 6 | 10eo_A |
10er_B | 10er | B | A | 1 | ASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVPCGRFPKKV... | seq_d61026e47f4265b59f0b86a6 | [
"1"
] | ELECTRON MICROSCOPY | 3.2 | 2026-05-27 | 0.878721 | 1 | core | seq_bb3a0a9b067359c4dba1d607 | struct_f388146ed7cea03a | component_3f8b289bd5ed90ed | train | 6 | 10eo_A |
10es_A | 10es | A | A | 1 | HHHHHHGGASRSASRLRSLASACSGGAEDGGGTSNGSLSASATATEDDELAIGTGYRLPPPEIRDIVDAPPVPALSFSPHRDKILFLKRRALPPLADLARPEEKLAGVRIDGYCNTRSRMSFYTGLGIHQLLPDGTLSPEKEITGIPDGGKINFVTWSNDGKHLAFSIRVDENGNSSKPVVWVADVETGVARPLFNSQDIFLNAIFESFVWIDNSTLLVSTIPSSRGEPPKKPLVPSGPKTLSNETKTVVQVRTFQDLLKDEYDADLFDYYASSQLVLASLDGTVKEVGVPAVYTSLDPSTDHKYLLVSSLHRPYSFIVP... | seq_ecae2105c114f891ff4a7502 | [
"1"
] | ELECTRON MICROSCOPY | 3 | 2026-05-27 | 0.878721 | 1 | core | seq_bb3a0a9b067359c4dba1d607 | struct_f388146ed7cea03a | component_3f8b289bd5ed90ed | train | 4 | 10es_A |
PDB-Chain-Complex-Benchmark-Rigor
Rigor rebuild of Synthyra/PDB-Chain-Complex-Benchmark with split assignments
recomputed from the published chain and complex parquet artifacts.
Split Policy
Splits are assigned by connected components over exact sequence, sequence hash, 30% sequence cluster, structure cluster, source split component, same-PDB asymmetric-unit membership, chain assembly membership, and biological assembly co-membership from the complex rows. The target is 90/5/5 (train/valid/test) by component count, not by row count, so the per-split row counts reported under Build Metadata are far from 90/5/5.
The rebuild hard-fails before upload if any chain or complex member leaks between the train, validation, and test splits by chain UID, sequence, sequence hash, 30% sequence cluster, structure cluster, or recomputed split component.
The list-valued payload columns of the complex table are regenerated from the
chain table during the rebuild and then checked directly on the emitted payloads,
including asymmetric_unit_chain_uids.
After writing parquet, the builder reloads the emitted chain and complex shards and reruns split-routing, payload-consistency, and disjointness checks from the serialized files.
This artifact-only rebuild does not rerun Foldseek or MMseqs2. It enforces and verifies the published cluster labels and, when supplied, optional external sequence-verification edges (none were supplied for this build; see sequence_verification_edges under Leakage Assertions).
Build Metadata
{
"batch_size": 16384,
"chain_scan": {
"assembly_membership_edges_seen": 1138910,
"asymmetric_unit_membership_edges_seen": 1069448,
"chains_scanned": 1069448
},
"chain_write": {
"file_counts": {
"test": 1,
"train": 22,
"valid": 1
},
"row_counts": {
"test": 334,
"train": 1068780,
"valid": 334
}
},
"complex_edge_scan": {
"complex_member_edges_seen": 775327,
"complexes_scanned_for_edges": 363583
},
"complex_write": {
"file_counts": {
"test": 1,
"train": 8,
"valid": 1
},
"member_chain_rows": 1138910,
"member_fields": {
"asymmetric_unit_chain_uids": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 1069448
},
"chain_uid": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 1069448
},
"sequence_clusters_30": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 48857
},
"sequence_hashes": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 183467
},
"sequences": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 183467
},
"split_components": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 6684
},
"structure_clusters": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 66989
}
},
"row_counts": {
"test": 335,
"train": 362909,
"valid": 339
}
},
"component_stats": {
"split_component_count": 6684,
"test_component_count": 334,
"train_component_count": 6016,
"valid_component_count": 334
},
"cpu_count": 32,
"elapsed_seconds": 75.866,
"foldseek_path": "",
"include_source_split_component_edges": true,
"max_rows_per_shard": 50000,
"mmseqs_path": "",
"nvidia-smi_path": "C:\\Windows\\system32\\nvidia-smi.EXE",
"nvidia-smi_version": "Tue Jun 30 18:02:49 2026 \n+-----------------------------------------------------------------------------------------+\n| NVIDIA-SMI 580.88 Driver Version: 580.88 CUDA Version: 13.0 |\n+-----------------------------------------+------------------------+----------------------+\n| GPU Name Driver-Model | Bus-Id Disp.A | Volatile Uncorr. ECC |\n| Fan Temp Perf Pwr:Usage/Cap | Memory-Usage | GPU-Util Compute M. |\n| | | MIG M. |\n|=========================================+========================+======================|\n| 0 NVIDIA GeForce RTX 4070 ... WDDM | 00000000:01:00.0 On | N/A |\n| N/A 41C P8 6W / 121W | 984MiB / 8188MiB | 10% Default |\n| | | N/A |\n+-----------------------------------------+------------------------+----------------------+\n\n+-----------------------------------------------------------------------------------------+\n| Processes: |\n| GPU GI CI PID Type Process name GPU Memory |\n| ID ID Usage |\n|=========================================================================================|\n| 0 N/A N/A 8844 C+G ...indows\\System32\\ShellHost.exe N/A |\n| 0 N/A N/A 10456 C+G ..._cw5n1h2txyewy\\SearchHost.exe N/A |\n| 0 N/A N/A 13212 C+G ...5n1h2txyewy\\TextInputHost.exe N/A |\n| 0 N/A N/A 36048 C+G ...Chrome\\Application\\chrome.exe N/A |\n| 0 N/A N/A 41088 C+G ...ntrolPanel\\SystemSettings.exe N/A |\n| 0 N/A N/A 63696 C+G ...8bbwe\\PhoneExperienceHost.exe N/A |\n| 0 N/A N/A 72372 C+G ...y\\StartMenuExperienceHost.exe N/A |\n| 0 N/A N/A 84244 C+G ...xyewy\\ShellExperienceHost.exe N/A |\n| 0 N/A N/A 104536 C+G C:\\Windows\\explorer.exe N/A |\n| 0 N/A N/A 152648 C+G ....0.4022.80\\msedgewebview2.exe N/A |\n| 0 N/A N/A 152984 C+G ...e Experience\\NVIDIA Share.exe N/A |\n| 0 N/A N/A 155976 C+G ...em32\\ApplicationFrameHost.exe N/A |\n| 0 N/A N/A 162800 C+G ...p\\app-3.6.1\\GitHubDesktop.exe N/A |\n| 0 N/A N/A 196292 C+G ...Chrome\\Application\\chrome.exe N/A |\n| 0 N/A N/A 198076 C+G ...__2p2nqsd0c76g0\\app\\Codex.exe N/A |\n| 0 
N/A N/A 206536 C+G ...2txyewy\\CrossDeviceResume.exe N/A |\n| 0 N/A N/A 221536 C+G ...Files\\Notepad++\\notepad++.exe N/A |\n+-----------------------------------------------------------------------------------------+",
"platform": "Windows-11-10.0.26200-SP0",
"python": "3.12.13",
"seed": 42,
"sequence_verification_max_unknown_fraction": 0.0,
"source_chain_rows": 1069448,
"source_complex_rows": 363583,
"source_repo_id": "Synthyra/PDB-Chain-Complex-Benchmark",
"source_snapshot_dir": "C:\\tmp\\hf_pdb_chain_complex_cache\\datasets--Synthyra--PDB-Chain-Complex-Benchmark\\snapshots\\3eb55ee7289dfedfbddf0cde48b68c5395783ccf",
"target_repo_id": "Synthyra/PDB-Chain-Complex-Benchmark-Rigor",
"test_frac": 0.05,
"valid_frac": 0.05
}
Leakage Assertions
{
"chains": {
"fields": {
"chain_uid": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 1069448
},
"seqs": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 183467
},
"sequence_cluster_30": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 48857
},
"sequence_hash": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 183467
},
"split_component": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 6684
},
"structure_cluster": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 66989
}
},
"post_write": {
"fields": {
"chain_uid": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 1069448
},
"seqs": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 183467
},
"sequence_cluster_30": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 48857
},
"sequence_hash": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 183467
},
"split_component": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 6684
},
"structure_cluster": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 66989
}
},
"rows": 1069448,
"split_counts": {
"test": 334,
"train": 1068780,
"valid": 334
}
},
"rows": 1069448,
"sequence_verification_edges": {
"checked_edges": 0,
"cross_split_edges": 0,
"provided": false,
"skipped_self_edges": 0,
"skipped_unknown_edges": 0,
"total_edges": 0
},
"split_counts": {
"test": 334,
"train": 1068780,
"valid": 334
}
},
"complexes": {
"member_chain_rows": 1138910,
"member_fields": {
"asymmetric_unit_chain_uids": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 1069448
},
"chain_uid": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 1069448
},
"sequence_clusters_30": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 48857
},
"sequence_hashes": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 183467
},
"sequences": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 183467
},
"split_components": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 6684
},
"structure_clusters": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 66989
}
},
"member_split_consistency": "passed",
"payload_columns_regenerated_from_chains": true,
"post_write": {
"asymmetric_unit_chain_rows": 1760175,
"member_chain_rows": 1138910,
"member_fields": {
"asymmetric_unit_chain_uids": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 1069448
},
"chain_uid": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 1069448
},
"sequence_clusters_30": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 48857
},
"sequence_hashes": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 183467
},
"sequences": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 183467
},
"split_components": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 6684
},
"structure_clusters": {
"crossing_values": 0,
"max_pairwise_overlap": 0,
"unique_values": 66989
}
},
"payload_columns_match_chain_rows": true,
"rows": 363583,
"shard_split_routing": "passed",
"split_counts": {
"test": 335,
"train": 362909,
"valid": 339
}
},
"rows": 363583,
"split_counts": {
"test": 335,
"train": 362909,
"valid": 339
}
}
}
- Downloads last month
- 11