123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486 |
- /**
- * Copyright (c) 2017 mol* contributors, licensed under MIT, See LICENSE file for more info.
- *
- * @author David Sehnal <david.sehnal@gmail.com>
- */
- import * as B from 'benchmark'
- import * as util from 'util'
- import * as fs from 'fs'
- import fetch from 'node-fetch'
- import CIF from 'mol-io/reader/cif'
- import { Structure, Model, Queries as Q, Element, Selection, StructureSymmetry, Query, Format, StructureProperties as SP } from 'mol-model/structure'
- //import { Segmentation, OrderedSet } from 'mol-data/int'
- import to_mmCIF from 'mol-model/structure/export/mmcif'
- import { Vec3 } from 'mol-math/linear-algebra';
- //import { printUnits } from 'apps/structure-info/model';
- //import { EquivalenceClasses } from 'mol-data/util';
// Run the `util.promisify` package's shim before `util.promisify` is used below
// (presumably it installs a polyfill on Node versions without a native one - confirm).
require('util.promisify').shim();

/** Promise-returning wrapper around `fs.readFile`. */
const readFileAsync = util.promisify(fs.readFile);

/** Promise-returning wrapper around `fs.writeFile`. */
const writeFileAsync = util.promisify(fs.writeFile);
/**
 * Reads a CIF file from disk.
 *
 * Paths ending in `.bcif` are read as binary and returned as a plain
 * `Uint8Array`; every other path is read as UTF-8 text.
 *
 * @param path Location of the file to read.
 * @returns The file bytes for `.bcif` paths, otherwise the file content as a string.
 */
async function readData(path: string): Promise<Uint8Array | string> {
    if (/\.bcif$/.test(path)) {
        const input = await readFileAsync(path);
        // Hand out a standalone Uint8Array rather than the Node Buffer itself.
        // The typed-array constructor copies the bytes in one step, replacing
        // the previous element-by-element loop.
        return new Uint8Array(input);
    }
    return readFileAsync(path, 'utf8');
}
// Polyfill Symbol.asyncIterator for runtimes that do not define it.
// Assign only when it is missing: on runtimes that already provide it the
// property is read-only, and writing to it (even with its own value) throws a
// TypeError in strict-mode code such as this module.
if (!(Symbol as any).asyncIterator) {
    (Symbol as any).asyncIterator = Symbol.for('Symbol.asyncIterator');
}
/**
 * Async iterator whose results carry either a `number` or a value of type `T`,
 * and whose `next` accepts an optional boolean.
 *
 * NOTE(review): judging by the names, the numbers are progress updates and
 * `cont` signals whether to continue - confirm with the author.
 */
interface ProgressGenerator<T> extends AsyncIterableIterator<number | T> {
    /**
     * Advances the generator.
     *
     * @param cont Optional flag forwarded to the generator body.
     */
    next(cont?: boolean): Promise<IteratorResult<number | T>>;
}
/**
 * Tiny async generator used to try out the progress-generator protocol:
 * it yields the number 10 once and then returns whatever value the consumer
 * passed to the following `next(...)` call.
 */
async function* test(): ProgressGenerator<boolean> {
    const pendingTen = new Promise<number>(resolve => {
        resolve(10);
    });
    const reply = yield await pendingTen;
    return reply;
}
/**
 * Drives a progress generator to completion.
 *
 * Every step is requested with `next(true)`; intermediate (yielded) values are
 * discarded and only the generator's final return value is handed back.
 *
 * @param itP Factory that creates the generator to run.
 * @returns The value of the first result whose `done` flag is set.
 */
async function runIt(itP: () => ProgressGenerator<boolean>) {
    const it = itP();
    let step = await it.next(true);
    while (!step.done) {
        step = await it.next(true);
    }
    return step.value;
}
// Smoke-run the sample generator at module load and print the value it finishes with.
runIt(test).then(result => {
    console.log('rerdasdasda', result);
});
/**
 * Loads a CIF file and builds models and structures from its first data block.
 *
 * The stages are timed on the console under the labels `readData`, `parse`,
 * `schema` and `buildModels`.
 *
 * @param path File to load; string content is parsed as text CIF, binary
 *             content as binary CIF.
 * @returns The mmCIF view of the first block, the models created from it and
 *          one structure per model.
 * @throws The parse result object itself when the parser reports an error.
 */
export async function readCIF(path: string) {
    console.time('readData');
    const input = await readData(path);
    console.timeEnd('readData');

    console.time('parse');
    const parseTask = typeof input === 'string'
        ? CIF.parseText(input)
        : CIF.parseBinary(input);
    const parsed = await parseTask.run();
    console.timeEnd('parse');

    if (parsed.isError) throw parsed;

    // Only the first data block of the file is used.
    const firstBlock = parsed.result.blocks[0];

    console.time('schema');
    const mmcif = Format.mmCIF(firstBlock);
    console.timeEnd('schema');

    console.time('buildModels');
    const models = await Model.create(mmcif).run();
    console.timeEnd('buildModels');

    const structures = models.map(Structure.ofModel);
    return { mmcif, models, structures };
}
/** Directory where downloaded BinaryCIF files and exported results are stored. */
const DATA_DIR = './build/data';

// Create the directory including missing parents: a plain mkdirSync fails with
// ENOENT when './build' itself does not exist yet. The existence check is kept
// so behaviour is unchanged on Node versions that ignore the `recursive` option.
if (!fs.existsSync(DATA_DIR)) fs.mkdirSync(DATA_DIR, { recursive: true });
/**
 * Builds the PDBe coordinate-server URL for the full BinaryCIF of an entry.
 *
 * The id is lower-cased and URL-escaped before being placed in the path, and
 * the request goes over HTTPS so the downloaded data is not fetched in plaintext.
 *
 * @param pdbId PDB entry id (any letter case).
 * @returns The download URL.
 */
function getBcifUrl(pdbId: string) {
    const entry = encodeURIComponent(pdbId.toLowerCase());
    return `https://www.ebi.ac.uk/pdbe/coordinates/${entry}/full?encoding=bcif`;
}
/**
 * Returns the location inside `DATA_DIR` where the BinaryCIF file of an entry is kept.
 *
 * @param pdbId PDB entry id (any letter case; lower-cased for the file name).
 */
function getBcifPath(pdbId: string) {
    const fileName = pdbId.toLowerCase() + '_full.bcif';
    return DATA_DIR + '/' + fileName;
}
/**
 * Makes sure the BinaryCIF file of an entry exists in the local data directory,
 * downloading it when it is not there yet.
 *
 * @param pdbId PDB entry id.
 * @throws Error when the server answers with a non-success HTTP status. Nothing
 *         is written in that case, so an error page is never stored (and later
 *         re-read) as if it were BinaryCIF data.
 */
async function ensureBcifAvailable(pdbId: string) {
    const bcifPath = getBcifPath(pdbId);
    if (fs.existsSync(bcifPath)) return;

    console.log(`downloading ${pdbId} bcif...`)
    const response = await fetch(getBcifUrl(pdbId));
    if (!response.ok) {
        throw new Error(`Failed to download ${pdbId} bcif: ${response.status} ${response.statusText}`);
    }
    await writeFileAsync(bcifPath, await response.buffer());
    console.log(`done downloading ${pdbId} bcif`)
}
/**
 * Loads the BinaryCIF of a PDB entry, downloading it into the local data
 * directory first when it is not available yet.
 *
 * @param pdbId PDB entry id.
 * @returns Whatever `readCIF` produces for the stored file.
 */
export async function getBcif(pdbId: string) {
    await ensureBcifAvailable(pdbId);
    const localPath = getBcifPath(pdbId);
    return readCIF(localPath);
}
/**
 * Ad-hoc experiments that time property access, symmetry/assembly building and
 * queries on loaded structures.
 */
export namespace PropertyAccess {
    /**
     * Sums `atom_site.id` over every row of the model's mmCIF source table.
     *
     * @throws Error when the model's source data is not of kind `mmCIF`.
     */
    function baseline(model: Model) {
        if (model.sourceData.kind !== 'mmCIF') throw new Error('Model must be mmCIF');

        const atom_site = model.sourceData.data.atom_site;
        const id = atom_site.id.value;
        let s = 0;
        for (let i = 0, _i = atom_site._rowCount; i < _i; i++) {
            s += id(i);
        }
        return s;
    }

    /**
     * Sums a numeric element property over all elements of all units of a structure.
     *
     * A single `Element.Location` is created up front and re-pointed at each
     * element instead of allocating one location per element.
     *
     * @param structure Structure whose units are visited.
     * @param p Property evaluated at every element location.
     */
    function sumProperty(structure: Structure, p: Element.Property<number>) {
        const l = Element.Location();
        let s = 0;

        for (const unit of structure.units) {
            l.unit = unit;
            const elements = unit.elements;
            for (let j = 0, _j = elements.length; j < _j; j++) {
                l.element = elements[j];
                s += p(l);
            }
        }

        return s;
    }

    // function sumPropertySegmented(structure: Structure, p: Element.Property<number>) {
    //     const { elements, units } = structure;
    //     const unitIds = ElementSet.unitIndices(elements);
    //     const l = Element.Location();

    //     let s = 0;

    //     let vA = 0, cC = 0, rC = 0;
    //     for (let i = 0, _i = unitIds.length; i < _i; i++) {
    //         const unit = units[unitIds[i]] as Unit.Atomic;
    //         l.unit = unit;
    //         const set = ElementSet.groupAt(elements, i);

    //         const chainsIt = Segmentation.transientSegments(unit.hierarchy.chainSegments, set.elements);
    //         const residues = unit.hierarchy.residueSegments;
    //         while (chainsIt.hasNext) {
    //             cC++;

    //             const chainSegment = chainsIt.move();
    //             const residuesIt = Segmentation.transientSegments(residues, set.elements, chainSegment);
    //             while (residuesIt.hasNext) {
    //                 rC++;
    //                 const residueSegment = residuesIt.move();
    //                 // l.element= OrdSet.getAt(set, residueSegment.start);
    //                 // console.log(unit.hierarchy.residues.auth_comp_id.value(unit.residueIndex[l.atom]), l.atom, OrdSet.getAt(set, residueSegment.end))
    //                 for (let j = residueSegment.start, _j = residueSegment.end; j < _j; j++) {
    //                     l.element= ElementGroup.getAt(set, j);
    //                     vA++;
    //                     s += p(l);
    //                 }
    //             }
    //         }
    //     }

    //     console.log('seg atom count', vA, cC, rC);

    //     return s;
    // }

    // function sumPropertyResidue(structure: Structure, p: Element.Property<number>) {
    //     const { atoms, units } = structure;
    //     const unitIds = ElementSet.unitIds(atoms);
    //     const l = Element.Location();

    //     let s = 0;

    //     for (let i = 0, _i = unitIds.length; i < _i; i++) {
    //         const unit = units[unitIds[i]];
    //         l.unit = unit;
    //         const set = ElementSet.unitGetByIndex(atoms, i);
    //         const residuesIt = Segmentation.transientSegments(unit.hierarchy.residueSegments, set.atoms);
    //         while (residuesIt.hasNext) {
    //             l.element= ElementGroup.getAt(set, residuesIt.move().start);
    //             s += p(l);
    //         }
    //     }

    //     return s;
    // }

    // function sumPropertyAtomSetIt(structure: Structure, p: Element.Property<number>) {
    //     const { elements, units } = structure;

    //     let s = 0;
    //     const atomsIt = ElementSet.elements(elements);
    //     const l = Element.Location();
    //     while (atomsIt.hasNext) {
    //         const a = atomsIt.move();
    //         l.unit = units[Element.unit(a)];
    //         l.element= Element.index(a);
    //         s += p(l);
    //     }
    //     return s;
    // }

    // function sumPropertySegmentedMutable(structure: Structure, p: Property<number>) {
    //     const { atoms, units } = structure;
    //     const unitIds = ElementSet.unitIds(atoms);
    //     const l = Property.createLocation();

    //     let s = 0;

    //     for (let i = 0, _i = unitIds.length; i < _i; i++) {
    //         const unit = units[unitIds[i]];
    //         l.unit = unit;
    //         const set = ElementSet.unitGetByIndex(atoms, i);

    //         const chainsIt = Segmentation.transientSegments(unit.hierarchy.chainSegments, set);
    //         const residuesIt = Segmentation.transientSegments(unit.hierarchy.residueSegments, set);
    //         while (chainsIt.hasNext) {
    //             const chainSegment = chainsIt.move();
    //             residuesIt.updateRange(chainSegment);
    //             while (residuesIt.hasNext) {
    //                 const residueSegment = residuesIt.move();
    //                 for (let j = residueSegment.start, _j = residueSegment.end; j < _j; j++) {
    //                     l.element= OrdSet.getAt(set, j);
    //                     s += p(l);
    //                 }
    //             }
    //         }
    //     }

    //     return s;
    // }

    // function sumDirect(structure: Structure) {
    //     const { atoms, units } = structure;
    //     const unitIds = ElementSet.unitIds(atoms);

    //     let s = 0;
    //     for (let i = 0, _i = unitIds.length; i < _i; i++) {
    //         const unitId = unitIds[i];
    //         const unit = units[unitId];
    //         const set = ElementSet.unitGetByIndex(atoms, i);
    //         //const { residueIndex, chainIndex } = unit;
    //         const p = unit.conformation.atomId.value;
    //         for (let j = 0, _j = ElementGroup.size(set); j < _j; j++) {
    //             const aI = ElementGroup.getAt(set, j);
    //             s += p(aI);
    //         }
    //     }

    //     return s;
    // }

    // function concatProperty(structure: Structure, p: Property<string>) {
    //     const { atoms, units } = structure;
    //     const unitIds = ElementSet.unitIds(atoms);
    //     const l = Property.createLocation(structure);

    //     let s = [];
    //     for (let i = 0, _i = unitIds.length; i < _i; i++) {
    //         const unitId = unitIds[i];
    //         l.unit = units[unitId];
    //         const set = ElementSet.unitGetByIndex(atoms, i);
    //         const { residueIndex, chainIndex } = l.unit;

    //         for (let j = 0, _j = OrdSet.size(set); j < _j; j++) {
    //             const aI = OrdSet.getAt(set, j);
    //             l.element= aI;
    //             l.residueIndex = residueIndex[aI];
    //             l.chainIndex = chainIndex[aI];
    //             s[s.length] = p(l);
    //         }
    //     }

    //     return s;
    // }

    /** Prints the mmCIF export of a structure (data block name `test`) to the console. */
    export function write(s: Structure) {
        console.log(to_mmCIF('test', s));
    }

    /**
     * Builds assembly `'1'` of a structure (timed under the label `assembly`)
     * and writes its export to `${DATA_DIR}/${id}_assembly.bcif`.
     *
     * @param id Used as the export name and as the file-name prefix.
     * @param s Structure the assembly is built from.
     */
    export async function testAssembly(id: string, s: Structure) {
        console.time('assembly')
        const a = await StructureSymmetry.buildAssembly(s, '1').run();
        //const auth_comp_id = SP.residue.auth_comp_id;
        //const q1 = Query(Q.generators.atoms({ residueTest: l => auth_comp_id(l) === 'ALA' }));
        //const alas = await query(q1, a);

        console.timeEnd('assembly')
        // NOTE(review): the third argument presumably selects binary output - confirm against to_mmCIF.
        fs.writeFileSync(`${DATA_DIR}/${id}_assembly.bcif`, to_mmCIF(id, a, true));
        //fs.writeFileSync(`${DATA_DIR}/${id}_assembly.bcif`, to_mmCIF(id, Selection.unionStructure(alas), true));
        console.log('exported');
    }

    /**
     * Builds the symmetry range from (-1, -1, -1) to (1, 1, 1) of a structure
     * (timed under the label `symmetry`) and writes its export to
     * `${DATA_DIR}/${id}_symm.bcif`.
     *
     * @param id Used as the export name and as the file-name prefix.
     * @param s Structure the symmetry mates are built from.
     */
    export async function testSymmetry(id: string, s: Structure) {
        console.time('symmetry')
        const a = await StructureSymmetry.buildSymmetryRange(s, Vec3.create(-1, -1, -1), Vec3.create(1, 1, 1)).run();
        //const auth_comp_id = SP.residue.auth_comp_id;
        //const q1 = Query(Q.generators.atoms({ residueTest: l => auth_comp_id(l) === 'ALA' }));
        //const alas = await query(q1, a);

        console.timeEnd('symmetry')
        fs.writeFileSync(`${DATA_DIR}/${id}_symm.bcif`, to_mmCIF(id, a, true));
        //fs.writeFileSync(`${DATA_DIR}/${id}_assembly.bcif`, to_mmCIF(id, Selection.unionStructure(alas), true));
        console.log('exported');
    }

    /**
     * Builds the symmetry range from (-2, -2, -2) to (2, 2, 2), selects the
     * `REA` residues of the units whose operator name is `1_555`, expands the
     * selection with `includeSurroundings` (radius 5, whole residues) and
     * writes the union of the result to `${DATA_DIR}/${id}_surr.cif`.
     *
     * Symmetry building and the query are timed together under the label `symmetry`.
     *
     * @param id Used as the export name and as the file-name prefix.
     * @param s Structure the symmetry mates are built from.
     */
    export async function testIncludeSurroundings(id: string, s: Structure) {
        //const a = s;
        console.time('symmetry')
        const a = await StructureSymmetry.buildSymmetryRange(s, Vec3.create(-2, -2, -2), Vec3.create(2, 2, 2)).run();
        //console.log(printUnits(a));

        const auth_comp_id = SP.residue.auth_comp_id, op = SP.unit.operator_name;
        //const q1 = Q.generators.atoms({ residueTest: l => auth_comp_id(l) === 'REA' });
        const q1 = Q.modifiers.includeSurroundings(Q.generators.atoms({
            chainTest: l => op(l) === '1_555',
            residueTest: l => auth_comp_id(l) === 'REA'
        }), {
            radius: 5,
            wholeResidues: true
        });
        const surr = Selection.unionStructure(await query(Query(q1), a));
        console.timeEnd('symmetry')

        // for (const u of surr.units) {
        //     const { atomId } = u.model.atomicConformation;
        //     console.log(`${u.id}, ${u.conformation.operator.name}`);
        //     for (let i = 0; i < u.elements.length; i++) {
        //         console.log(`  ${atomId.value(u.elements[i])}`);
        //     }
        // }

        // const it = surr.elementLocations();
        // while (it.hasNext) {
        //     const e = it.move();
        //     console.log(`${SP.unit.operator_name(e)} ${SP.atom.id(e)}`);
        // }
        //fs.writeFileSync(`${DATA_DIR}/${id}_surr.bcif`, to_mmCIF(id, a, true));
        fs.writeFileSync(`${DATA_DIR}/${id}_surr.cif`, to_mmCIF(id, surr, false));
        console.log('exported');
    }

    // export async function testGrouping(structure: Structure) {
    //     const { elements, units } = await Run(Symmetry.buildAssembly(structure, '1'));
    //     console.log('grouping', units.length);
    //     console.log('built asm');

    //     const uniqueGroups = EquivalenceClasses<number, { unit: Unit, group: ElementGroup }>(
    //         ({ unit, group }) => ElementGroup.hashCode(group),
    //         (a, b) => a.unit.model.id === b.unit.model.id && (a.group.key === b.group.key && OrderedSet.areEqual(a.group.elements, b.group.elements))
    //     );

    //     for (let i = 0, _i = ElementSet.groupCount(elements); i < _i; i++) {
    //         const group = ElementSet.groupAt(elements, i);
    //         const unitId = ElementSet.groupUnitIndex(elements, i);
    //         uniqueGroups.add(unitId, { unit: units[unitId], group });
    //     }

    //     console.log('group count', uniqueGroups.groups.length);
    // }

    /** Runs a query on a structure and returns the promise of its result. */
    function query(q: Query, s: Structure) {
        return q(s).run();
    }

    /**
     * Wraps a query as a deferred benchmark.js test function.
     *
     * benchmark.js does not await promises returned by a test function, so an
     * `async` test would only time the creation of the promise. A deferred
     * test (registered with `{ defer: true }`) is timed until
     * `deferred.resolve()` is called, which happens once the query has finished.
     * A rejected query is not handled here and surfaces as an unhandled rejection.
     */
    function deferredQuery(q: Query, s: Structure) {
        return (deferred: { resolve(): void }) => {
            query(q, s).then(() => deferred.resolve());
        };
    }

    /**
     * Entry point of the experiments: loads a structure from a hard-coded local
     * file, runs the include-surroundings export, prints a few property sums
     * and query timings and finally starts a benchmark.js suite.
     *
     * The returned promise settles once the suite has been started, not when
     * the benchmarks have finished.
     */
    export async function run() {
        //const { structures, models/*, mmcif*/ } = await getBcif('1cbs');
        // const { structures, models } = await getBcif('3j3q');

        const { structures, models /*, mmcif*/ } = await readCIF('e:/test/quick/1cbs_updated.cif');
        //const { structures: s1, /*, mmcif*/ } = await readCIF('e:/test/quick/1tqn_updated.cif');

        // testGrouping(structures[0]);
        // console.log('------');
        // testGrouping(s1[0]);
        //const { structures, models/*, mmcif*/ } = await readCIF('e:/test/quick/5j7v_updated.cif');

        //console.log(mmcif.pdbx_struct_oper_list.matrix.toArray());
        // console.log(mmcif.pdbx_struct_oper_list.vector.toArray());

        //await testAssembly('1hrv', structures[0]);
        //await testSymmetry('1cbs', structures[0]);
        await testIncludeSurroundings('1cbs', structures[0]);
        // throw '';

        // console.log(models[0].symmetry.assemblies);

        //const { structures, models } = await readCIF('e:/test/molstar/3j3q.bcif');

        // fs.writeFileSync('e:/test/molstar/3j3q.bcif', to_mmCIF('test', structures[0], true));
        // return;

        // console.log(toMmCIFString('test', structures[0]));

        // return;

        console.log('bs', baseline(models[0]));
        console.log('sp', sumProperty(structures[0], l => l.unit.model.atomicConformation.atomId.value(l.element)));
        //console.log(sumPropertySegmented(structures[0], l => l.unit.model.atomSiteConformation.atomId.value(l.element)));

        //console.log(sumPropertySegmentedMutable(structures[0], l => l.unit.model.conformation.atomId.value(l.element));
        //console.log(sumPropertyAtomSetIt(structures[0], l => l.unit.model.atomSiteConformation.atomId.value(l.element)));
        //console.log(sumProperty(structures[0], Property.cachedAtomColumn(m => m.conformation.atomId)));
        //console.log(sumDirect(structures[0]));
        //console.log('r', sumPropertyResidue(structures[0], l => l.unit.hierarchy.residues.auth_seq_id.value(l.unit.residueIndex[l.atom])));

        console.time('atom.x');
        console.log('atom.x', sumProperty(structures[0], SP.atom.x));
        console.timeEnd('atom.x');
        // The measured statement of this timer is commented out; the pair is
        // kept so the console output stays the same.
        console.time('__x')
        //console.log('__x', sumProperty(structures[0], l => l.unit.conformation.x[l.atom]));
        console.timeEnd('__x')

        //const authSeqId = Element.property(l => l.unit.hierarchy.residues.auth_seq_id.value(l.unit.residueIndex[l.atom]));

        //const auth_seq_id = SP.residue.auth_seq_id;
        const auth_comp_id = SP.residue.auth_comp_id;
        //const auth_asym_id = SP.chain.auth_asym_id;
        //const set = new Set(['A', 'B', 'C', 'D']);
        //const q = Q.generators.atomGroups({ atomTest: l => auth_seq_id(l) < 3 });
        const q = Query(Q.generators.atoms({ atomTest: Q.pred.eq(SP.residue.auth_comp_id, 'ALA') }));
        const P = SP
        //const q0 = Q.generators.atoms({ atomTest: l => auth_comp_id(l) === 'ALA' });
        const q1 = Query(Q.generators.atoms({ residueTest: l => auth_comp_id(l) === 'ALA' }));
        const q2 = Query(Q.generators.atoms({ residueTest: l => auth_comp_id(l) === 'ALA', groupBy: SP.residue.key }));
        const q3 = Query(Q.generators.atoms({
            chainTest: Q.pred.inSet(P.chain.auth_asym_id, ['A', 'B', 'C', 'D']),
            residueTest: Q.pred.eq(P.residue.auth_comp_id, 'ALA')
        }));
        await query(q, structures[0]);
        //console.log(to_mmCIF('test', Selection.union(q0r)));

        // q1 is timed twice in a row under the same label.
        console.time('q1')
        await query(q1, structures[0]);
        console.timeEnd('q1')
        console.time('q1')
        await query(q1, structures[0]);
        console.timeEnd('q1')
        console.time('q2')
        const q2r = await query(q2, structures[0]);
        console.timeEnd('q2')
        console.log(Selection.structureCount(q2r));
        //console.log(q1(structures[0]));

        const col = models[0].atomicConformation.atomId.value;
        const suite = new B.Suite();
        suite
            //.add('test q', () => q1(structures[0]))
            //.add('test q', () => q(structures[0]))
            .add('test int', () => sumProperty(structures[0], l => col(l.element)))
            // Asynchronous queries are registered as deferred tests so the
            // whole query run is measured, not just the promise creation.
            .add('test q1', deferredQuery(q1, structures[0]), { defer: true })
            .add('test q3', deferredQuery(q3, structures[0]), { defer: true })
            // .add('sum residue', () => sumPropertyResidue(structures[0], l => l.unit.hierarchy.residues.auth_seq_id.value(l.unit.residueIndex[l.atom])))

            // .add('baseline', () => baseline(models[0]))
            // .add('direct', () => sumDirect(structures[0]))

            //.add('normal int', () => sumProperty(structures[0], l => l.unit.model.conformation.atomId.value(l.element))
            //.add('atom set it int', () => sumPropertyAtomSetIt(structures[0], l => l.unit.conformation.atomId.value(l.element))
            // .add('segmented faster int', () => sumPropertySegmented(structures[0], l => l.unit.conformation.atomId.value(l.element))
            // .add('faster int', () => sumProperty(structures[0], l => l.unit.conformation.atomId.value(l.element))
            //.add('segmented faster _x', () => sumPropertySegmented(structures[0], l => l.unit.conformation.__x[l.atom]))
            //.add('faster _x', () => sumProperty(structures[0], l => l.unit.conformation.__x[l.atom] +  l.unit.conformation.__y[l.atom] +  l.unit.conformation.__z[l.atom]))
            //.add('segmented mut faster int', () => sumPropertySegmentedMutable(structures[0], l => l.unit.conformation.atomId.value(l.element))
            //.add('normal shortcut int', () => sumProperty(structures[0], l => l.conformation.atomId.value(l.element))
            //.add('cached int', () => sumProperty(structures[0], Property.cachedAtomColumn(m => m.conformation.atomId)))
            //.add('concat str', () => concatProperty(structures[0], l => l.unit.model.hierarchy.atoms.auth_atom_id.value(l.element))
            //.add('cached concat str', () => concatProperty(structures[0], Property.cachedAtomColumn(m => m.hierarchy.atoms.auth_atom_id)))
            .on('cycle', (e: any) => console.log(String(e.target)))
            .run();
    }
}
// Start the experiments at module load. Failures are reported explicitly and
// mark the process as failed instead of being left on a floating promise.
PropertyAccess.run().catch(e => {
    console.error(e);
    process.exitCode = 1;
});
|