123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430 |
- /**
- * Copyright (c) 2017-2023 mol* contributors, licensed under MIT, See LICENSE file for more info.
- *
- * @author David Sehnal <david.sehnal@gmail.com>
- * @author Alexander Rose <alexander.rose@weirdbyte.de>
- */
- import { UUID } from '../../../mol-util/uuid';
- import { StructureSequence } from './properties/sequence';
- import { AtomicHierarchy, AtomicConformation, AtomicRanges } from './properties/atomic';
- import { CoarseHierarchy, CoarseConformation } from './properties/coarse';
- import { Entities, ChemicalComponentMap, MissingResidues, StructAsymMap } from './properties/common';
- import { CustomProperties } from '../../custom-property';
- import { SaccharideComponentMap } from '../structure/carbohydrates/constants';
- import { ModelFormat } from '../../../mol-model-formats/format';
- import { calcModelCenter, getAsymIdCount } from './util';
- import { Vec3 } from '../../../mol-math/linear-algebra';
- import { Coordinates } from '../coordinates';
- import { Topology } from '../topology';
- import { Task } from '../../../mol-task';
- import { IndexPairBonds } from '../../../mol-model-formats/structure/property/bonds/index-pair';
- import { createModels } from '../../../mol-model-formats/structure/basic/parser';
- import { MmcifFormat } from '../../../mol-model-formats/structure/mmcif';
- import { ChainIndex, ElementIndex } from './indexing';
- import { SymmetryOperator } from '../../../mol-math/geometry';
- import { ModelSymmetry } from '../../../mol-model-formats/structure/property/symmetry';
- import { Column } from '../../../mol-data/db';
- import { CustomModelProperty } from '../../../mol-model-props/common/custom-model-property';
- import { Trajectory, ArrayTrajectory } from '../trajectory';
- import { Unit } from '../structure';
- import { SortedArray } from '../../../mol-data/int/sorted-array';
- import { PolymerType } from './types';
- import { ModelSecondaryStructure } from '../../../mol-model-formats/structure/property/secondary-structure';
/**
 * Read-only description of the "source data" of a molecule.
 *
 * "Atoms" are integers in the range [0, atomCount).
 */
export interface Model extends Readonly<{
    /** identifier of this model instance */
    id: UUID;
    entryId: string;
    label: string;

    /** the name of the entry/file/collection the model is part of */
    entry: string;

    /**
     * corresponds to
     * - for IHM: `ihm_model_list.model_id`
     * - for standard mmCIF: `atom_site.pdbx_PDB_model_num`
     * - for models from coordinates: frame index
     */
    modelNum: number;

    /** the parsed input the model was created from */
    sourceData: ModelFormat;
    /** `undefined` when the model has no parent model */
    parent: Model | undefined;

    entities: Entities;
    sequence: StructureSequence;

    atomicHierarchy: AtomicHierarchy;
    atomicConformation: AtomicConformation;
    atomicRanges: AtomicRanges;
    /** NOTE(review): the doubled "n" in the name is part of the existing public API */
    atomicChainOperatorMappinng: Map<ChainIndex, SymmetryOperator>;

    properties: {
        /** map that holds details about unobserved or zero occurrence residues */
        readonly missingResidues: MissingResidues;
        /** maps residue name to `ChemicalComponent` data */
        readonly chemicalComponentMap: ChemicalComponentMap;
        /** maps residue name to `SaccharideComponent` data */
        readonly saccharideComponentMap: SaccharideComponentMap;
        /** maps label_asym_id name to `StructAsym` data */
        readonly structAsymMap: StructAsymMap;
    };

    customProperties: CustomProperties;

    /**
     * Not to be accessed directly, each custom property descriptor
     * defines property accessors that use this field to store the data.
     */
    _staticPropertyData: { [name: string]: any };
    _dynamicPropertyData: { [name: string]: any };

    coarseHierarchy: CoarseHierarchy;
    coarseConformation: CoarseConformation;
}> { }
- export namespace Model {
/**
 * Creates one model per coordinate frame by copying `model` and replacing
 * its atomic conformation with the one built from the frame.
 *
 * Every frame model receives a new id, the frame index as `modelNum`, fresh
 * custom-property containers, its trajectory info and the coarse-grained
 * flag of `model`. Frames that carry a cell additionally get a symmetry
 * built from the cell size and angles.
 *
 * @throws Error if a frame's element count differs from the atom count of `model`.
 * @returns the frame models together with the source-index array that was
 *          passed to the conformation builder (`undefined` when the atom
 *          source index is the identity).
 */
function _trajectoryFromModelAndCoordinates(model: Model, coordinates: Coordinates) {
    const { frames } = coordinates;
    const atomSourceIndex = model.atomicHierarchy.atomSourceIndex;
    // no remapping array is needed when atoms are already in source order
    const srcIndexArray = Column.isIdentity(atomSourceIndex)
        ? undefined
        : atomSourceIndex.toArray({ array: Int32Array });
    const coarseGrained = isCoarseGrained(model);
    const expectedCount = model.atomicHierarchy.atoms._rowCount;
    const frameCount = frames.length;

    const trajectory: Model[] = [];
    for (let frameIndex = 0; frameIndex < frameCount; ++frameIndex) {
        const frame = frames[frameIndex];
        if (frame.elementCount !== expectedCount) {
            throw new Error(`Frame element count mismatch, got ${frame.elementCount} but expected ${expectedCount}.`);
        }

        const { atomId, occupancy, B_iso_or_equiv } = model.atomicConformation;
        const frameModel = {
            ...model,
            id: UUID.create22(),
            modelNum: frameIndex,
            atomicConformation: Coordinates.getAtomicConformation(
                frame,
                { atomId, occupancy, B_iso_or_equiv },
                srcIndexArray
            ),
            // TODO: add support for supplying sphere and gaussian coordinates in addition to atomic coordinates?
            // coarseConformation: coarse.conformation,
            customProperties: new CustomProperties(),
            _staticPropertyData: Object.create(null),
            _dynamicPropertyData: Object.create(null)
        };

        if (frame.cell) {
            const { size, anglesInRadians } = frame.cell;
            ModelSymmetry.Provider.set(frameModel, ModelSymmetry.fromCell(size, anglesInRadians));
        }

        TrajectoryInfo.set(frameModel, { index: frameIndex, size: frames.length });
        CoarseGrained.set(frameModel, coarseGrained);

        trajectory.push(frameModel);
    }

    return { trajectory, srcIndexArray };
}
/**
 * Wraps the per-frame models derived from `model` and `coordinates`
 * in an `ArrayTrajectory`.
 */
export function trajectoryFromModelAndCoordinates(model: Model, coordinates: Coordinates): Trajectory {
    const { trajectory } = _trajectoryFromModelAndCoordinates(model, coordinates);
    return new ArrayTrajectory(trajectory);
}
/**
 * Returns a task that creates models from the topology, expands the
 * representative model over all coordinate frames and attaches the
 * topology's bonds (as index-pair bonds), the trajectory info and the
 * coarse-grained flag to every frame model.
 *
 * The task fails with an `Error('found no model')` when the topology
 * yields no models.
 */
export function trajectoryFromTopologyAndCoordinates(topology: Topology, coordinates: Coordinates): Task<Trajectory> {
    return Task.create('Create Trajectory', async ctx => {
        const models = await createModels(topology.basic, topology.sourceData, ctx);
        if (models.frameCount === 0) throw new Error('found no model');

        const model = models.representative;
        const { trajectory } = _trajectoryFromModelAndCoordinates(model, coordinates);

        // the same bond set is shared by all frames
        const indexPairBonds = IndexPairBonds.fromData({
            pairs: topology.bonds,
            count: model.atomicHierarchy.atoms._rowCount
        });
        const coarseGrained = isCoarseGrained(model);

        trajectory.forEach((frameModel, frameIndex) => {
            IndexPairBonds.Provider.set(frameModel, indexPairBonds);
            TrajectoryInfo.set(frameModel, { index: frameIndex, size: trajectory.length });
            CoarseGrained.set(frameModel, coarseGrained);
        });

        return new ArrayTrajectory(trajectory);
    });
}
const CenterProp = '__Center__';

/**
 * Returns the center of the model, computed from its atomic and coarse
 * conformations on first use and then cached in the model's dynamic
 * property data.
 */
export function getCenter(model: Model): Vec3 {
    const store = model._dynamicPropertyData;
    const cached = store[CenterProp];
    if (cached) return cached;

    const computed = calcModelCenter(model.atomicConformation, model.coarseConformation);
    store[CenterProp] = computed;
    return computed;
}
/**
 * Builds the inverse of an index column: for every row `i` with value `x`
 * the result satisfies `invertedIndex[x] === i`.
 *
 * @param xs column of target indices; values are used as positions into an
 *           `Int32Array` of length `xs.rowCount`
 * @returns `invertedIndex` and `isIdentity`, which is `true` exactly when
 *          every row maps to itself (also for an empty column).
 */
function invertIndex(xs: Column<number>) {
    const rowCount = xs.rowCount;
    const invertedIndex = new Int32Array(rowCount);
    // start optimistic; the flag used to be initialised to `false` and could
    // therefore never report an identity mapping
    let isIdentity = true;
    for (let i = 0; i < rowCount; i++) {
        const x = xs.value(i);
        if (x !== i) isIdentity = false;
        invertedIndex[x] = i;
    }
    return { isIdentity, invertedIndex: invertedIndex as unknown as ArrayLike<ElementIndex> };
}
const InvertedAtomSrcIndexProp = '__InvertedAtomSrcIndex__';

/**
 * Returns the inverted atom source index of the model. The result is
 * computed on first use and cached in the model's static property data.
 */
export function getInvertedAtomSourceIndex(model: Model): { isIdentity: boolean, invertedIndex: ArrayLike<ElementIndex> } {
    const store = model._staticPropertyData;
    const cached = store[InvertedAtomSrcIndexProp];
    if (cached) return cached;

    const inverted = invertIndex(model.atomicHierarchy.atomSourceIndex);
    store[InvertedAtomSrcIndexProp] = inverted;
    return inverted;
}
const TrajectoryInfoProp = '__TrajectoryInfo__';

/** Position of a model within a trajectory and the trajectory's size. */
export type TrajectoryInfo = { readonly index: number, readonly size: number }

/** Accessors for the trajectory info kept in a model's dynamic property data. */
export const TrajectoryInfo = {
    /** Returns the stored info, or `{ index: 0, size: 1 }` when none is stored. */
    get(model: Model): TrajectoryInfo {
        const stored = model._dynamicPropertyData[TrajectoryInfoProp];
        return stored ? stored : { index: 0, size: 1 };
    },
    /** Stores `trajectoryInfo` on the model and returns it. */
    set(model: Model, trajectoryInfo: TrajectoryInfo) {
        model._dynamicPropertyData[TrajectoryInfoProp] = trajectoryInfo;
        return trajectoryInfo;
    }
};
const AsymIdCountProp = '__AsymIdCount__';

/** Counts for `auth` and `label` asym ids of a model. */
export type AsymIdCount = { readonly auth: number, readonly label: number }

/** Accessor for the asym id counts kept in a model's dynamic property data. */
export const AsymIdCount = {
    /** Returns the counts, computing and caching them on first use. */
    get(model: Model): AsymIdCount {
        const store = model._dynamicPropertyData;
        if (!store[AsymIdCountProp]) {
            store[AsymIdCountProp] = getAsymIdCount(model);
        }
        return store[AsymIdCountProp];
    },
};
/** Value type of the `asym_id_offset` model property. */
export type AsymIdOffset = {
    auth: number,
    label: number
};
/** Simple custom model property registered as 'asym_id_offset' ('static'). */
export const AsymIdOffset = CustomModelProperty.createSimple<AsymIdOffset>('asym_id_offset', 'static');

/** Value type of the `index` model property. */
export type Index = number;
/** Simple custom model property registered as 'index' ('static'). */
export const Index = CustomModelProperty.createSimple<Index>('index', 'static');

/** Value type of the `max_index` model property. */
export type MaxIndex = number;
/** Simple custom model property registered as 'max_index' ('static'). */
export const MaxIndex = CustomModelProperty.createSimple<MaxIndex>('max_index', 'static');
/** Returns the model's parent when it has one, otherwise the model itself. */
export function getRoot(model: Model) {
    const { parent } = model;
    return parent ? parent : model;
}
/**
 * Checks whether two models share the very same (reference-equal) atomic
 * and coarse hierarchy objects.
 */
export function areHierarchiesEqual(a: Model, b: Model) {
    if (a.atomicHierarchy !== b.atomicHierarchy) return false;
    return a.coarseHierarchy === b.coarseHierarchy;
}
const CoordinatesHistoryProp = '__CoordinatesHistory__';

/** Object able to compare the coordinates of a set of elements against a model. */
export type CoordinatesHistory = {
    areEqual(elements: SortedArray<ElementIndex>, kind: Unit.Kind, model: Model): boolean
}

/** Accessors for the coordinates history kept in a model's static property data. */
export const CoordinatesHistory = {
    /** Returns the stored history, or `undefined` when none has been set. */
    get(model: Model): CoordinatesHistory | undefined {
        const { _staticPropertyData: store } = model;
        return store[CoordinatesHistoryProp];
    },
    /** Stores `coordinatesHistory` on the model and returns it. */
    set(model: Model, coordinatesHistory: CoordinatesHistory) {
        model._staticPropertyData[CoordinatesHistoryProp] = coordinatesHistory;
        return coordinatesHistory;
    }
};
const CoarseGrainedProp = '__CoarseGrained__';

/** Accessors for the coarse-grained flag kept in a model's static property data. */
export const CoarseGrained = {
    /** Returns the stored flag, or `undefined` when it has not been set yet. */
    get(model: Model): boolean | undefined {
        const { _staticPropertyData: store } = model;
        return store[CoarseGrainedProp];
    },
    /** Stores the flag on the model and returns it. */
    set(model: Model, coarseGrained: boolean) {
        model._staticPropertyData[CoarseGrainedProp] = coarseGrained;
        return coarseGrained;
    }
};
/**
 * A model counts as coarse grained when it has the typical coarse grained
 * atom names (both BB and SC1) or when it has less than three times as many
 * atoms as polymer residues (C-alpha only models).
 *
 * The result is stored via `CoarseGrained` and reused on later calls.
 */
export function isCoarseGrained(model: Model): boolean {
    const cached = CoarseGrained.get(model);
    if (cached !== undefined) return cached;

    // residues whose polymer type is not `PolymerType.NA`
    const { polymerType } = model.atomicHierarchy.derived.residue;
    let polymerResidueCount = 0;
    for (let rI = 0; rI < polymerType.length; ++rI) {
        if (polymerType[rI] !== PolymerType.NA) polymerResidueCount++;
    }

    // check for coarse grained atom names, stopping once both were seen
    const { label_atom_id, _rowCount: atomCount } = model.atomicHierarchy.atoms;
    let hasBB = false, hasSC1 = false;
    for (let aI = 0; aI < atomCount && !(hasBB && hasSC1); ++aI) {
        const name = label_atom_id.value(aI);
        if (name === 'BB') hasBB = true;
        else if (name === 'SC1') hasSC1 = true;
    }

    let coarseGrained: boolean;
    if (hasBB && hasSC1) {
        coarseGrained = true;
    } else if (polymerResidueCount && atomCount) {
        coarseGrained = atomCount / polymerResidueCount < 3;
    } else {
        coarseGrained = false;
    }

    CoarseGrained.set(model, coarseGrained);
    return coarseGrained;
}
- //
/** True when the model's saccharide component map has at least one entry. */
export function hasCarbohydrate(model: Model): boolean {
    const { saccharideComponentMap } = model.properties;
    return saccharideComponentMap.size > 0;
}
/** True when any entity subtype starts with 'polypeptide'. */
export function hasProtein(model: Model): boolean {
    const subtypes = model.entities.subtype;
    const count = subtypes.rowCount;
    let row = 0;
    while (row < count) {
        if (subtypes.value(row).startsWith('polypeptide')) return true;
        row += 1;
    }
    return false;
}
/**
 * True when any entity subtype ends with 'ribonucleotide hybrid' or
 * 'ribonucleotide'.
 */
export function hasNucleic(model: Model): boolean {
    const subtypes = model.entities.subtype;
    const count = subtypes.rowCount;
    for (let row = 0; row < count; ++row) {
        const entitySubtype = subtypes.value(row);
        if (entitySubtype.endsWith('ribonucleotide hybrid')) return true;
        if (entitySubtype.endsWith('ribonucleotide')) return true;
    }
    return false;
}
/**
 * True for mmCIF-sourced models whose `database_2.database_id` column
 * contains the value 'pdb'. Always false for other source formats.
 */
export function isFromPdbArchive(model: Model): boolean {
    if (!MmcifFormat.is(model.sourceData)) return false;

    const { database_id } = model.sourceData.data.db.database_2;
    const count = database_id.rowCount;
    for (let row = 0; row < count; ++row) {
        if (database_id.value(row) === 'pdb') return true;
    }
    return false;
}
/**
 * True for mmCIF-sourced models whose `entryId` looks like a PDB id,
 * either in the 4 character or in the long `pdb_` prefixed form.
 * Always false for other source formats.
 */
export function hasPdbId(model: Model): boolean {
    if (!MmcifFormat.is(model.sourceData)) return false;

    const { entryId } = model;
    // 4 character PDB id
    if (/^[1-9][a-z0-9]{3,3}$/i.test(entryId)) return true;
    // long PDB id
    return /^pdb_[0-9]{4,4}[1-9][a-z0-9]{3,3}$/i.test(entryId);
}
/**
 * For mmCIF-sourced models: true when `struct_conf.id` or
 * `struct_sheet_range.id` is defined. For every other source format the
 * answer is delegated to the secondary structure provider.
 */
export function hasSecondaryStructure(model: Model): boolean {
    if (!MmcifFormat.is(model.sourceData)) {
        return ModelSecondaryStructure.Provider.isApplicable(model);
    }

    const { struct_conf, struct_sheet_range } = model.sourceData.data.db;
    return struct_conf.id.isDefined || struct_sheet_range.id.isDefined;
}
const tmpAngles90 = Vec3.create(1.5707963, 1.5707963, 1.5707963); // in radians
const tmpLengths1 = Vec3.create(1, 1, 1);

/**
 * True when the model has a spacegroup, unless that spacegroup has
 * number 1 together with a cell of 90 degree angles and unit lengths.
 */
export function hasCrystalSymmetry(model: Model): boolean {
    const spacegroup = ModelSymmetry.Provider.get(model)?.spacegroup;
    if (!spacegroup) return false;

    const isUnitCellP1 = spacegroup.num === 1 &&
        Vec3.equals(spacegroup.cell.anglesInRadians, tmpAngles90) &&
        Vec3.equals(spacegroup.cell.size, tmpLengths1);
    return !isUnitCellP1;
}
/**
 * True for mmCIF-sourced models where any `exptl.method` value contains
 * 'DIFFRACTION' (compared case-insensitively). Always false for other
 * source formats.
 */
export function isFromXray(model: Model): boolean {
    if (!MmcifFormat.is(model.sourceData)) return false;

    const { method } = model.sourceData.data.db.exptl;
    for (let row = 0; row < method.rowCount; row++) {
        if (method.value(row).toUpperCase().includes('DIFFRACTION')) return true;
    }
    return false;
}
/**
 * True for mmCIF-sourced models where any `exptl.method` value contains
 * 'MICROSCOPY' (compared case-insensitively). Always false for other
 * source formats.
 */
export function isFromEm(model: Model): boolean {
    if (!MmcifFormat.is(model.sourceData)) return false;

    const { method } = model.sourceData.data.db.exptl;
    for (let row = 0; row < method.rowCount; row++) {
        if (method.value(row).toUpperCase().includes('MICROSCOPY')) return true;
    }
    return false;
}
/**
 * True for mmCIF-sourced models where any `exptl.method` value contains
 * 'NMR' (compared case-insensitively). Always false for other source
 * formats.
 */
export function isFromNmr(model: Model): boolean {
    if (!MmcifFormat.is(model.sourceData)) return false;

    const { method } = model.sourceData.data.db.exptl;
    for (let row = 0; row < method.rowCount; row++) {
        if (method.value(row).toUpperCase().includes('NMR')) return true;
    }
    return false;
}
/**
 * True for mmCIF-sourced diffraction models whose
 * `pdbx_database_status.status_code_sf` is defined and has 'REL' as its
 * first value. Always false for other source formats.
 */
export function hasXrayMap(model: Model): boolean {
    if (!MmcifFormat.is(model.sourceData)) return false;
    // Check experimental method to exclude models solved with
    // 'ELECTRON CRYSTALLOGRAPHY' which also have structure factors
    if (!isFromXray(model)) return false;

    const { status_code_sf } = model.sourceData.data.db.pdbx_database_status;
    if (!status_code_sf.isDefined) return false;
    return status_code_sf.value(0) === 'REL';
}
/**
 * True for mmCIF-sourced models that list a related 'EMDB' entry.
 *
 * Also checks for `content_type` of 'associated EM volume' to exclude cases
 * like 6TEK which are solved with 'X-RAY DIFFRACTION' but have a related
 * EMDB entry of type 'other EM volume'.
 */
export function hasEmMap(model: Model): boolean {
    if (!MmcifFormat.is(model.sourceData)) return false;

    const related = model.sourceData.data.db.pdbx_database_related;
    const { db_name, content_type } = related;
    const rowCount = related._rowCount;
    for (let row = 0; row < rowCount; ++row) {
        const isEmdb = db_name.value(row).toUpperCase() === 'EMDB';
        if (isEmdb && content_type.value(row) === 'associated EM volume') return true;
    }
    return false;
}
/**
 * True for mmCIF-sourced models that have an X-ray map or an EM map.
 * Always false for other source formats.
 */
export function hasDensityMap(model: Model): boolean {
    return MmcifFormat.is(model.sourceData)
        ? hasXrayMap(model) || hasEmMap(model)
        : false;
}
/**
 * Like `hasDensityMap`, but additionally answers true for models with a
 * PDB id whose meta data needed for a definite answer is missing:
 * - `exptl.method` is not defined, or
 * - diffraction model without a defined / with an unknown first
 *   `status_code_sf`, or
 * - EM model without a defined `pdbx_database_related.db_name`.
 *
 * Always false for non-mmCIF source formats.
 */
export function probablyHasDensityMap(model: Model): boolean {
    if (!MmcifFormat.is(model.sourceData)) return false;
    const { db } = model.sourceData.data;

    if (hasDensityMap(model)) return true;

    // check if from pdb archive but missing relevant meta data
    if (!hasPdbId(model)) return false;
    if (!db.exptl.method.isDefined) return true;

    if (isFromXray(model)) {
        const { status_code_sf } = db.pdbx_database_status;
        if (!status_code_sf.isDefined) return true;
        if (status_code_sf.valueKind(0) === Column.ValueKinds.Unknown) return true;
    }

    return isFromEm(model) && !db.pdbx_database_related.db_name.isDefined;
}
- }
|