symmetry.ts 5.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129
  1. /**
  2. * Copyright (C) 2022, Protein Bioinformatics Research Group, RCNS
  3. *
  4. * Licensed under CC BY-NC 4.0, see LICENSE file for more info.
  5. *
  6. * @author Gabor Tusnady <tusnady.gabor@ttk.hu>
  7. * @author Csongor Gerdan <gerdan.csongor@ttk.hu>
  8. */
  9. import { MmcifFormat } from '../../mol-model-formats/structure/mmcif';
  10. import { Column, Table } from '../../mol-data/db';
  11. import { mmCIF_Schema } from '../../mol-io/reader/cif/schema/mmcif';
  12. import { Model } from '../../mol-model/structure';
  13. import { ModelSymmetry } from '../../mol-model-formats/structure/property/symmetry';
  14. import { PDBTMDescriptor } from './types';
  15. import { DebugUtil } from './debug-utils';
  16. export function registerTmDetSymmetry(pdbtmDescriptor: PDBTMDescriptor) {
  17. ModelSymmetry.Provider.formatRegistry.remove('mmCIF');
  18. const excludedChains = constructChainListFromOperations(pdbtmDescriptor);
  19. ModelSymmetry.Provider.formatRegistry.add('mmCIF', function(model: Model) {
  20. return tmDetSymmetryFromMmCif(model, excludedChains);
  21. });
  22. }
  23. function constructChainListFromOperations(pdbtmDescriptor: PDBTMDescriptor): string[] {
  24. const excludedChains: string[] = [];
  25. // add chain deletes
  26. const biomatrix = pdbtmDescriptor.additional_entry_annotations.biomatrix;
  27. if (biomatrix?.chain_deletes) {
  28. biomatrix.chain_deletes.forEach(
  29. chainId => excludedChains.push(chainId)
  30. );
  31. }
  32. // exclude result of transformations
  33. if (biomatrix?.matrix_list) {
  34. biomatrix.matrix_list.forEach(
  35. matrix => matrix.apply_to_chain_list.forEach(
  36. applyItem => excludedChains.push(applyItem.new_chain_id)
  37. )
  38. );
  39. }
  40. return excludedChains;
  41. }
  42. function tmDetSymmetryFromMmCif(model: Model, excludedChains: string[]) {
  43. if (!MmcifFormat.is(model.sourceData)) return;
  44. let data = model.sourceData.data.db;
  45. let asymIdColumnData: string[][] = [];
  46. // update chains (asym) for each author_defined_assemly
  47. // NOTE: We assume that the first assembly is an author defined assembly.
  48. const currentAssemblyId: string = data.pdbx_struct_assembly_gen.assembly_id.value(0);
  49. excludedChains = union(
  50. excludedChains,
  51. Array.from(data.pdbx_nonpoly_scheme.asym_id.toArray())
  52. );
  53. const result: string[][] = createAsymIdColumnData(
  54. data.pdbx_struct_assembly_gen, currentAssemblyId, excludedChains
  55. );
  56. asymIdColumnData = asymIdColumnData.concat(result);
  57. const asym_id_list_column = Column.ofStringListArray(asymIdColumnData);
  58. // create table with new column
  59. let updated_pdbx_struct_assembly_gen = Table.ofColumns(
  60. data.pdbx_struct_assembly_gen._schema,
  61. {
  62. assembly_id: data.pdbx_struct_assembly_gen.assembly_id,
  63. asym_id_list: asym_id_list_column,
  64. //oper_expression: data.pdbx_struct_assembly_gen.oper_expression
  65. // NOTE: we expect here pdbx_struct_assembly_gen has only one row
  66. oper_expression: Column.ofStringArray([ '1' ])
  67. }
  68. );
  69. DebugUtil.log('Orig. assembly_gen', Table.formatToString(data.pdbx_struct_assembly_gen));
  70. DebugUtil.log('Updated assembly_gen', Table.formatToString(updated_pdbx_struct_assembly_gen));
  71. DebugUtil.log('Oper expression:', data.pdbx_struct_assembly_gen.oper_expression.toArray());
  72. DebugUtil.log('Non-poly entities:', Table.formatToString(data.pdbx_entity_nonpoly));
  73. DebugUtil.log('Non-poly chains:', data.pdbx_nonpoly_scheme.asym_id.toArray());
  74. DebugUtil.log('Excluded chains:', excludedChains);
  75. DebugUtil.log('Included chains:', result);
  76. DebugUtil.log('oper_list table: original:', Table.formatToString(data.pdbx_struct_oper_list));
  77. const only_identity_operation = Table.ofRows(
  78. data.pdbx_struct_oper_list._schema, [ Table.getRow(data.pdbx_struct_oper_list, 0) ]
  79. );
  80. DebugUtil.log('oper_list table: first row', Table.formatToString(only_identity_operation));
  81. return ModelSymmetry.fromData({
  82. symmetry: data.symmetry,
  83. cell: data.cell,
  84. struct_ncs_oper: data.struct_ncs_oper,
  85. atom_sites: data.atom_sites,
  86. pdbx_struct_assembly: data.pdbx_struct_assembly,
  87. pdbx_struct_assembly_gen: updated_pdbx_struct_assembly_gen,
  88. pdbx_struct_oper_list: only_identity_operation
  89. });
  90. }
  91. function createAsymIdColumnData(pdbx_struct_assembly_gen: Table<mmCIF_Schema['pdbx_struct_assembly_gen']>, assemblyId: string, chains: string[]) {
  92. const asym_id_list: string[][] = [];
  93. for (let i = 0; i < pdbx_struct_assembly_gen._rowCount; i++) {
  94. const currentAsymIdList = pdbx_struct_assembly_gen.asym_id_list.value(i);
  95. asym_id_list.push(
  96. (assemblyId == pdbx_struct_assembly_gen.assembly_id.value(i))
  97. ? minus(currentAsymIdList, chains)
  98. : currentAsymIdList
  99. );
  100. }
  101. return asym_id_list;
  102. }
  103. // difference of two string arrays (interpreted as sets)
  104. function minus(a: string[], b: string[]): string[] {
  105. const b_set = new Set(b);
  106. return a.filter(x => !b_set.has(x));
  107. }
  108. // union of two string arrays (interpreted as sets)
  109. function union(a: string[], b: string[]): string[] {
  110. const a_set = new Set(a);
  111. b.forEach(item => a_set.add(item));
  112. return Array.from(a_set.values());
  113. }