123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227 |
- import { MolScriptBuilder as MS } from 'molstar/lib/mol-script/language/builder';
- import { StructureSelectionQueries as Q } from 'molstar/lib/mol-plugin-state/helpers/structure-selection-query';
- import { StructureRepresentationRegistry } from 'molstar/lib/mol-repr/structure/registry';
- import { Expression } from 'molstar/lib/mol-script/language/expression';
- import { QueryContext, Structure, StructureElement, StructureSelection } from 'molstar/lib/mol-model/structure';
- import { compile } from 'molstar/lib/mol-script/runtime/query/compiler';
/**
 * Describes what a single selection target should match. Every property is optional; the properties that are set
 * are turned into tests against the atom/chain properties of the same name.
 */
export type Target = {
    /** Compared against the 'auth_seq_id' atom property. When set, 'label_seq_id' is not consulted. */
    readonly auth_seq_id?: number;
    /** Compared against the 'label_seq_id' atom property. */
    readonly label_seq_id?: number;
    /** Compared against the 'label_comp_id' atom property. */
    readonly label_comp_id?: string;
    /** Compared against the 'label_asym_id' atom property. */
    readonly label_asym_id?: string;
    /**
     * Mol*-internal representation, like 'ASM_2'. Enumerated in the order of appearance in the source file. Specify
     * the assemblyId when using this selector.
     */
    readonly operatorName?: string;
    /**
     * Strucmotif-/BioJava-specific representation, like 'Px42'. This is a single 'pdbx_struct_oper_list.id' value
     * or a combination thereof. Specify the assemblyId when using this selector. Order matters, use the order as
     * specified in the source CIF file.
     */
    readonly struct_oper_id?: string;
};
/**
 * A selection of one chain, optionally narrowed to a span of 'label_seq_id' values.
 */
export type Range = {
    /** Chain to select, compared against the 'label_asym_id' atom property. */
    label_asym_id: string;
    /** Optional residue span; 'beg' is required, 'end' may be left out. */
    label_seq_id?: { beg: number; end?: number };
};
/**
 * Expands two bounds into the ascending list of all integers between them, both bounds included.
 * The bounds may be given in either order.
 * @param start first bound
 * @param end optional second bound; when omitted the result contains only 'start'
 * @returns ascending list of values from the smaller to the larger bound
 */
export const toRange = (start: number, end?: number): number[] => {
    // Test for "not provided" explicitly: a truthiness check would also discard a legitimate bound of 0.
    // NaN keeps its previous meaning of "no usable end".
    if (end == null || Number.isNaN(end)) return [start];
    const lower = Math.min(start, end);
    const upper = Math.max(start, end);
    return Array.from({ length: upper - lower + 1 }, (_, offset) => lower + offset);
};
/**
 * One selectable component: a query expression together with the metadata used to present it.
 */
export type SelectionExpression = {
    /** Short identifier of the component, e.g. 'polymer' or 'ligand'. */
    tag: string;
    /** Name of the built-in representation to use, e.g. 'cartoon' or 'ball-and-stick'. */
    type: StructureRepresentationRegistry.BuiltIn;
    /** Human-readable label of the component. */
    label: string;
    /** Query that picks the atoms belonging to this component. */
    expression: Expression;
    /** Optional visibility flag; not read anywhere in this file. */
    isHidden?: boolean;
    /** Optional color as a number; not read anywhere in this file. */
    color?: number;
};
/**
 * Adapter between the strucmotif-/BioJava way of identifying transformed chains and the Mol* way.
 * A target that carries a 'struct_oper_id' gets it translated into an 'operatorName'; the 'struct_oper_id' is
 * dropped and any pre-existing 'operatorName' is overridden. Targets that have neither are assigned the fallback
 * operator, targets that already have an 'operatorName' are passed through untouched.
 * @param targets collection to process
 * @param structure parent structure
 * @param operatorName optional value to which missing operators are set, will default to 'ASM_1' if not specified
 * @returns a new array with one normalized target per input target
 */
export function normalizeTargets(targets: Target[], structure: Structure, operatorName: string = 'ASM_1'): Target[] {
    return targets.map(target => {
        const { struct_oper_id: operExpression, ...remainder } = target;
        if (operExpression) {
            // the translated name wins over whatever 'operatorName' the target carried before
            return { ...remainder, operatorName: toOperatorName(structure, operExpression) };
        }
        if (target.operatorName) {
            return target;
        }
        return { ...target, operatorName };
    });
}
/**
 * Finds the Mol* operator name ('ASM_<operId>') of the first unit whose assembly operators correspond to the
 * given strucmotif-/BioJava-style operator expression.
 * @param structure structure whose units are searched
 * @param expression operator expression, e.g. '1' or '2x1'
 * @returns the matching operator name
 * @throws Error if no unit has an assembly matching the expression
 */
function toOperatorName(structure: Structure, expression: string): string {
    // Renders an operator list in the strucmotif notation. Only the first two operators are considered.
    const render = (operList: any[]) => {
        const count = operList ? operList.length : 0;
        // this makes the assumption that '1' is the identity operator
        if (!count) return '1';
        // Mol* operators are right-to-left, hence the swapped order
        return count === 1 ? operList[0] : operList[1] + 'x' + operList[0];
    };

    for (const { conformation } of structure.units) {
        const { assembly } = conformation.operator;
        // units that are not part of an assembly cannot match
        if (assembly && render(assembly.operList) === expression) {
            return `ASM_${assembly.operId}`;
        }
    }

    // TODO better error handling?
    throw Error(`Unable to find expression '${expression}'`);
}
/**
 * Convert a selection to an array of selection expressions.
 *
 * - No selection: one expression per default component (polymers, ligands, ions, carbohydrates, lipids, waters).
 * - A set of Targets: a single 'ball-and-stick' expression that merges all targets.
 * - A Range: a single 'cartoon' expression for the chain, restricted to the residue span if one is given.
 *
 * @param labelBase the base label that will appear in the UI (e.g., the entry ID)
 * @param selection a selection by Range or a set of Targets
 * @returns the selection expressions describing the requested components
 * @throws Error if the selection is neither an array of Targets nor a Range
 */
export function createSelectionExpressions(labelBase: string, selection?: Range | Target[]): SelectionExpression[] {
    if (!selection) {
        return [
            {
                expression: Q.polymer.expression,
                label: `${labelBase} - Polymers`,
                type: 'cartoon',
                tag: 'polymer'
            },
            {
                expression: Q.ligand.expression,
                label: `${labelBase} - Ligands`,
                type: 'ball-and-stick',
                tag: 'ligand'
            },
            {
                expression: Q.ion.expression,
                label: `${labelBase} - Ions`,
                type: 'ball-and-stick',
                tag: 'ion'
            },
            {
                expression: Q.branched.expression,
                label: `${labelBase} - Carbohydrates`,
                type: 'carbohydrate',
                tag: 'branched-snfg-3d'
            },
            {
                expression: Q.lipid.expression,
                label: `${labelBase} - Lipids`,
                type: 'ball-and-stick',
                tag: 'lipid'
            },
            {
                expression: Q.water.expression,
                label: `${labelBase} - Waters`,
                type: 'ball-and-stick',
                tag: 'water'
            }
        ];
    }

    if (Array.isArray(selection)) {
        return [{
            expression: targetsToExpression(selection),
            label: labelBase,
            type: 'ball-and-stick',
            tag: 'polymer'
        }];
    }

    // 'label_seq_id' is optional on a Range, so only the mandatory 'label_asym_id' identifies one. Requiring both
    // keys would reject a whole-chain Range even though the code below handles a missing residue span.
    if ('label_asym_id' in selection) {
        const residues: number[] = selection.label_seq_id
            ? toRange(selection.label_seq_id.beg, selection.label_seq_id.end)
            : [];
        return [{
            expression: MS.struct.generator.atomGroups(rangeToTest(selection.label_asym_id, residues)),
            label: labelFromProps(labelBase, selection),
            type: 'cartoon',
            tag: 'polymer'
        }];
    }

    // serialize explicitly, plain concatenation would only print '[object Object]'
    throw new Error('Unable to handle selection: ' + JSON.stringify(selection));
}
/**
 * Builds the label of a range selection in the form '<entryId>.<label_asym_id>:<first>-<last>'. Parts without
 * a value are left out; the '-<last>' suffix only appears when the range spans more than one residue.
 * @param entryId base of the label
 * @param range range the label describes
 */
const labelFromProps = (entryId: string, range: Range) => {
    const span = range.label_seq_id;
    const residues: number[] = span ? toRange(span.beg, span.end) : [];

    let label = entryId;
    if (range.label_asym_id) {
        label += `.${range.label_asym_id}`;
    }
    if (residues.length > 0) {
        label += `:${residues[0]}`;
    }
    if (residues.length > 1) {
        label += `-${residues[residues.length - 1]}`;
    }
    return label;
};
/**
 * Creates the test object for an atom-group query that selects one chain and, optionally, a set of residues.
 * @param asymId value the 'label_asym_id' property must equal
 * @param residues 'label_seq_id' values to accept; when empty, no residue test is added
 * @returns an object with a 'chain-test' and, for a non-empty residue list, a 'residue-test'
 */
export function rangeToTest(asymId: string, residues: number[]) {
    const chainTest = MS.core.rel.eq([MS.ammp('label_asym_id'), asymId]);
    if (residues.length === 0) {
        return { 'chain-test': chainTest };
    }
    return {
        'chain-test': chainTest,
        'residue-test': MS.core.set.has([MS.set(...residues), MS.ammp('label_seq_id')])
    };
}
/**
 * Resolves a target to a loci by compiling its expression and running the resulting query on the structure.
 * @param target target to resolve
 * @param structure structure the query is executed on
 * @returns the selection converted with 'StructureSelection.toLociWithSourceUnits'
 */
export function targetToLoci(target: Target, structure: Structure): StructureElement.Loci {
    const runQuery = compile<StructureSelection>(targetToExpression(target));
    const matched = runQuery(new QueryContext(structure));
    return StructureSelection.toLociWithSourceUnits(matched);
}
/**
 * Builds one expression per target and merges them into a single expression.
 * @param targets targets to combine
 */
function targetsToExpression(targets: Target[]): Expression {
    return MS.struct.combinator.merge(
        targets.map(target => targetToExpression(target))
    );
}
/**
 * Translates a target into a query expression.
 *
 * Residue-level criteria ('auth_seq_id' or, if that is absent, 'label_seq_id', plus 'label_comp_id') form the
 * 'residue-test'; chain-level criteria ('label_asym_id', 'operatorName') form the 'chain-test'. Several criteria
 * of the same level are joined with a logical AND.
 *
 * @param target target to translate
 * @returns a union over the matching atom groups, or the empty generator if the target sets no criterion
 */
function targetToExpression(target: Target): Expression {
    const residueTests: Expression[] = [];
    const chainTests: Expression[] = [];
    // either test may be absent, the keys are only added when there is something to test
    const tests: { 'residue-test'?: Expression, 'chain-test'?: Expression } = Object.create(null);

    // Compare against null/undefined instead of relying on truthiness: a residue number of 0 is a legitimate
    // value and must not silently widen the selection to the whole chain.
    if (target.auth_seq_id != null) {
        residueTests.push(MS.core.rel.eq([target.auth_seq_id, MS.ammp('auth_seq_id')]));
    } else if (target.label_seq_id != null) {
        residueTests.push(MS.core.rel.eq([target.label_seq_id, MS.ammp('label_seq_id')]));
    }
    if (target.label_comp_id) {
        residueTests.push(MS.core.rel.eq([target.label_comp_id, MS.ammp('label_comp_id')]));
    }
    if (residueTests.length === 1) {
        tests['residue-test'] = residueTests[0];
    } else if (residueTests.length > 1) {
        tests['residue-test'] = MS.core.logic.and(residueTests);
    }

    if (target.label_asym_id) {
        chainTests.push(MS.core.rel.eq([target.label_asym_id, MS.ammp('label_asym_id')]));
    }
    if (target.operatorName) {
        chainTests.push(MS.core.rel.eq([target.operatorName, MS.acp('operatorName')]));
    }
    if (chainTests.length === 1) {
        tests['chain-test'] = chainTests[0];
    } else if (chainTests.length > 1) {
        tests['chain-test'] = MS.core.logic.and(chainTests);
    }

    if (Object.keys(tests).length > 0) {
        return MS.struct.modifier.union([
            MS.struct.generator.atomGroups(tests)
        ]);
    } else {
        // no criterion at all: select nothing rather than everything
        return MS.struct.generator.empty;
    }
}
|