model.ts 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334
  1. /**
  2. * Copyright (c) 2017-2020 mol* contributors, licensed under MIT, See LICENSE file for more info.
  3. *
  4. * @author David Sehnal <david.sehnal@gmail.com>
  5. * @author Alexander Rose <alexander.rose@weirdbyte.de>
  6. */
  7. import UUID from '../../../mol-util/uuid';
  8. import StructureSequence from './properties/sequence';
  9. import { AtomicHierarchy, AtomicConformation, AtomicRanges } from './properties/atomic';
  10. import { CoarseHierarchy, CoarseConformation } from './properties/coarse';
  11. import { Entities, ChemicalComponentMap, MissingResidues, StructAsymMap } from './properties/common';
  12. import { CustomProperties } from '../../custom-property';
  13. import { SaccharideComponentMap } from '../structure/carbohydrates/constants';
  14. import { ModelFormat } from '../../../mol-model-formats/format';
  15. import { calcModelCenter, getAsymIdCount } from './util';
  16. import { Vec3 } from '../../../mol-math/linear-algebra';
  17. import { Coordinates } from '../coordinates';
  18. import { Topology } from '../topology';
  19. import { Task } from '../../../mol-task';
  20. import { IndexPairBonds } from '../../../mol-model-formats/structure/property/bonds/index-pair';
  21. import { createModels } from '../../../mol-model-formats/structure/basic/parser';
  22. import { MmcifFormat } from '../../../mol-model-formats/structure/mmcif';
  23. import { ChainIndex } from './indexing';
  24. import { SymmetryOperator } from '../../../mol-math/geometry';
  25. import { ModelSymmetry } from '../../../mol-model-formats/structure/property/symmetry';
  26. import { Column } from '../../../mol-data/db';
  27. import { CustomModelProperty } from '../../../mol-model-props/common/custom-model-property';
  28. import { Trajectory, ArrayTrajectory } from '../trajectory';
  29. /**
  30. * Interface to the "source data" of the molecule.
  31. *
  32. * "Atoms" are integers in the range [0, atomCount).
  33. */
  34. export interface Model extends Readonly<{
  35. id: UUID,
  36. entryId: string,
  37. label: string,
  38. /** the name of the entry/file/collection the model is part of */
  39. entry: string,
  40. /**
  41. * corresponds to
  42. * - for IHM: `ihm_model_list.model_id`
  43. * - for standard mmCIF: `atom_site.pdbx_PDB_model_num`
  44. * - for models from coordinates: frame index
  45. */
  46. modelNum: number,
  47. sourceData: ModelFormat,
  48. parent: Model | undefined,
  49. entities: Entities,
  50. sequence: StructureSequence,
  51. atomicHierarchy: AtomicHierarchy,
  52. atomicConformation: AtomicConformation,
  53. atomicRanges: AtomicRanges,
  54. atomicChainOperatorMappinng: Map<ChainIndex, SymmetryOperator>,
  55. properties: {
  56. /** map that holds details about unobserved or zero occurrence residues */
  57. readonly missingResidues: MissingResidues,
  58. /** maps residue name to `ChemicalComponent` data */
  59. readonly chemicalComponentMap: ChemicalComponentMap
  60. /** maps residue name to `SaccharideComponent` data */
  61. readonly saccharideComponentMap: SaccharideComponentMap
  62. /** maps label_asym_id name to `StructAsym` data */
  63. readonly structAsymMap: StructAsymMap
  64. },
  65. customProperties: CustomProperties,
  66. /**
  67. * Not to be accessed directly, each custom property descriptor
  68. * defines property accessors that use this field to store the data.
  69. */
  70. _staticPropertyData: { [name: string]: any },
  71. _dynamicPropertyData: { [name: string]: any },
  72. coarseHierarchy: CoarseHierarchy,
  73. coarseConformation: CoarseConformation
  74. }> {
  75. } { }
  76. export namespace Model {
  77. function _trajectoryFromModelAndCoordinates(model: Model, coordinates: Coordinates) {
  78. const trajectory: Model[] = [];
  79. const { frames } = coordinates;
  80. const srcIndex = model.atomicHierarchy.atoms.sourceIndex;
  81. const isIdentity = Column.isIdentity(srcIndex);
  82. const srcIndexArray = isIdentity ? void 0 : srcIndex.toArray({ array: Int32Array });
  83. for (let i = 0, il = frames.length; i < il; ++i) {
  84. const f = frames[i];
  85. const m = {
  86. ...model,
  87. id: UUID.create22(),
  88. modelNum: i,
  89. atomicConformation: isIdentity
  90. ? Coordinates.getAtomicConformation(f, model.atomicConformation.atomId)
  91. : Coordinates.getAtomicConformationReordered(f, model.atomicConformation.atomId, srcIndexArray!),
  92. // TODO: add support for supplying sphere and gaussian coordinates in addition to atomic coordinates?
  93. // coarseConformation: coarse.conformation,
  94. customProperties: new CustomProperties(),
  95. _staticPropertyData: Object.create(null),
  96. _dynamicPropertyData: Object.create(null)
  97. };
  98. trajectory.push(m);
  99. }
  100. return { trajectory, srcIndexArray };
  101. }
  102. export function trajectoryFromModelAndCoordinates(model: Model, coordinates: Coordinates): Trajectory {
  103. return new ArrayTrajectory(_trajectoryFromModelAndCoordinates(model, coordinates).trajectory);
  104. }
  105. export function invertIndex(xs: ArrayLike<number>) {
  106. const ret = new Int32Array(xs.length);
  107. for (let i = 0, _i = xs.length; i < _i; i++) {
  108. ret[xs[i]] = i;
  109. }
  110. return ret;
  111. }
  112. export function trajectoryFromTopologyAndCoordinates(topology: Topology, coordinates: Coordinates): Task<Trajectory> {
  113. return Task.create('Create Trajectory', async ctx => {
  114. const models = await createModels(topology.basic, topology.sourceData, ctx);
  115. if (models.frameCount === 0) throw new Error('found no model');
  116. const model = models.representative;
  117. const { trajectory, srcIndexArray } = _trajectoryFromModelAndCoordinates(model, coordinates);
  118. // TODO: cache the inverted index somewhere?
  119. const invertedIndex = srcIndexArray ? invertIndex(srcIndexArray) : void 0;
  120. const pairs = srcIndexArray
  121. ? {
  122. indexA: Column.ofIntArray(Column.mapToArray(topology.bonds.indexA, i => invertedIndex![i], Int32Array)),
  123. indexB: Column.ofIntArray(Column.mapToArray(topology.bonds.indexB, i => invertedIndex![i], Int32Array)),
  124. order: topology.bonds.order
  125. }
  126. : topology.bonds;
  127. const bondData = { pairs, count: model.atomicHierarchy.atoms._rowCount };
  128. const indexPairBonds = IndexPairBonds.fromData(bondData);
  129. let index = 0;
  130. for (const m of trajectory) {
  131. IndexPairBonds.Provider.set(m, indexPairBonds);
  132. TrajectoryInfo.set(m, { index: index++, size: trajectory.length });
  133. }
  134. return new ArrayTrajectory(trajectory);
  135. });
  136. }
  137. const CenterProp = '__Center__';
  138. export function getCenter(model: Model): Vec3 {
  139. if (model._dynamicPropertyData[CenterProp]) return model._dynamicPropertyData[CenterProp];
  140. const center = calcModelCenter(model.atomicConformation, model.coarseConformation);
  141. model._dynamicPropertyData[CenterProp] = center;
  142. return center;
  143. }
  144. const TrajectoryInfoProp = '__TrajectoryInfo__';
  145. export type TrajectoryInfo = { readonly index: number, readonly size: number }
  146. export const TrajectoryInfo = {
  147. get(model: Model): TrajectoryInfo {
  148. return model._staticPropertyData[TrajectoryInfoProp] || { index: 0, size: 1 };
  149. },
  150. set(model: Model, trajectoryInfo: TrajectoryInfo) {
  151. return model._staticPropertyData[TrajectoryInfoProp] = trajectoryInfo;
  152. }
  153. };
  154. const AsymIdCountProp = '__AsymIdCount__';
  155. export type AsymIdCount = { readonly auth: number, readonly label: number }
  156. export const AsymIdCount = {
  157. get(model: Model): AsymIdCount {
  158. if (model._staticPropertyData[AsymIdCountProp]) return model._staticPropertyData[AsymIdCountProp];
  159. const asymIdCount = getAsymIdCount(model);
  160. model._staticPropertyData[AsymIdCountProp] = asymIdCount;
  161. return asymIdCount;
  162. },
  163. };
  164. export type AsymIdOffset = { auth: number, label: number };
  165. export const AsymIdOffset = CustomModelProperty.createSimple<AsymIdOffset>('asym_id_offset', 'static');
  166. export type Index = number;
  167. export const Index = CustomModelProperty.createSimple<Index>('index', 'static');
  168. export function getRoot(model: Model) {
  169. return model.parent || model;
  170. }
  171. //
  172. export function hasCarbohydrate(model: Model): boolean {
  173. return model.properties.saccharideComponentMap.size > 0;
  174. }
  175. export function hasProtein(model: Model): boolean {
  176. const { subtype } = model.entities;
  177. for (let i = 0, il = subtype.rowCount; i < il; ++i) {
  178. if (subtype.value(i).startsWith('polypeptide')) return true;
  179. }
  180. return false;
  181. }
  182. export function hasNucleic(model: Model): boolean {
  183. const { subtype } = model.entities;
  184. for (let i = 0, il = subtype.rowCount; i < il; ++i) {
  185. const s = subtype.value(i);
  186. if (s.endsWith('ribonucleotide hybrid') || s.endsWith('ribonucleotide')) return true;
  187. }
  188. return false;
  189. }
  190. export function isFromPdbArchive(model: Model): boolean {
  191. if (!MmcifFormat.is(model.sourceData)) return false;
  192. const { db } = model.sourceData.data;
  193. return (
  194. db.database_2.database_id.isDefined ||
  195. // 4 character PDB id
  196. model.entryId.match(/^[1-9][a-z0-9]{3,3}$/i) !== null ||
  197. // long PDB id
  198. model.entryId.match(/^pdb_[0-9]{4,4}[1-9][a-z0-9]{3,3}$/i) !== null
  199. );
  200. }
  201. export function hasSecondaryStructure(model: Model): boolean {
  202. if (!MmcifFormat.is(model.sourceData)) return false;
  203. const { db } = model.sourceData.data;
  204. return (
  205. db.struct_conf.id.isDefined ||
  206. db.struct_sheet_range.id.isDefined
  207. );
  208. }
  209. const tmpAngles90 = Vec3.create(1.5707963, 1.5707963, 1.5707963); // in radians
  210. const tmpLengths1 = Vec3.create(1, 1, 1);
  211. export function hasCrystalSymmetry(model: Model): boolean {
  212. const spacegroup = ModelSymmetry.Provider.get(model)?.spacegroup;
  213. return !!spacegroup && !(
  214. spacegroup.num === 1 &&
  215. Vec3.equals(spacegroup.cell.anglesInRadians, tmpAngles90) &&
  216. Vec3.equals(spacegroup.cell.size, tmpLengths1)
  217. );
  218. }
  219. export function isFromXray(model: Model): boolean {
  220. if (!MmcifFormat.is(model.sourceData)) return false;
  221. const { db } = model.sourceData.data;
  222. for (let i = 0; i < db.exptl.method.rowCount; i++) {
  223. const v = db.exptl.method.value(i).toUpperCase();
  224. if (v.indexOf('DIFFRACTION') >= 0) return true;
  225. }
  226. return false;
  227. }
  228. export function isFromEm(model: Model): boolean {
  229. if (!MmcifFormat.is(model.sourceData)) return false;
  230. const { db } = model.sourceData.data;
  231. for (let i = 0; i < db.exptl.method.rowCount; i++) {
  232. const v = db.exptl.method.value(i).toUpperCase();
  233. if (v.indexOf('MICROSCOPY') >= 0) return true;
  234. }
  235. return false;
  236. }
  237. export function isFromNmr(model: Model): boolean {
  238. if (!MmcifFormat.is(model.sourceData)) return false;
  239. const { db } = model.sourceData.data;
  240. for (let i = 0; i < db.exptl.method.rowCount; i++) {
  241. const v = db.exptl.method.value(i).toUpperCase();
  242. if (v.indexOf('NMR') >= 0) return true;
  243. }
  244. return false;
  245. }
  246. export function hasXrayMap(model: Model): boolean {
  247. if (!MmcifFormat.is(model.sourceData)) return false;
  248. // Check exprimental method to exclude models solved with
  249. // 'ELECTRON CRYSTALLOGRAPHY' which also have structure factors
  250. if (!isFromXray(model)) return false;
  251. const { db } = model.sourceData.data;
  252. const { status_code_sf } = db.pdbx_database_status;
  253. return status_code_sf.isDefined && status_code_sf.value(0) === 'REL';
  254. }
  255. /**
  256. * Also checks for `content_type` of 'associated EM volume' to exclude cases
  257. * like 6TEK which are solved with 'X-RAY DIFFRACTION' but have an related
  258. * EMDB entry of type 'other EM volume'.
  259. */
  260. export function hasEmMap(model: Model): boolean {
  261. if (!MmcifFormat.is(model.sourceData)) return false;
  262. const { db } = model.sourceData.data;
  263. const { db_name, content_type } = db.pdbx_database_related;
  264. for (let i = 0, il = db.pdbx_database_related._rowCount; i < il; ++i) {
  265. if (db_name.value(i).toUpperCase() === 'EMDB' && content_type.value(i) === 'associated EM volume') {
  266. return true;
  267. }
  268. }
  269. return false;
  270. }
  271. export function hasDensityMap(model: Model): boolean {
  272. if (!MmcifFormat.is(model.sourceData)) return false;
  273. return hasXrayMap(model) || hasEmMap(model);
  274. }
  275. export function probablyHasDensityMap(model: Model): boolean {
  276. if (!MmcifFormat.is(model.sourceData)) return false;
  277. const { db } = model.sourceData.data;
  278. return hasDensityMap(model) || (
  279. // check if from pdb archive but missing relevant meta data
  280. isFromPdbArchive(model) && (
  281. !db.exptl.method.isDefined ||
  282. (isFromXray(model) && (
  283. !db.pdbx_database_status.status_code_sf.isDefined ||
  284. db.pdbx_database_status.status_code_sf.valueKind(0) === Column.ValueKind.Unknown
  285. )) ||
  286. (isFromEm(model) && (
  287. !db.pdbx_database_related.db_name.isDefined
  288. ))
  289. )
  290. );
  291. }
  292. }